poca-SoccerTwos / run_logs /timers.json
fortminors's picture
First Push
0faa616 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.1738739013671875,
"min": 3.1062047481536865,
"max": 3.295743465423584,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 57180.51171875,
"min": 10395.6015625,
"max": 134590.828125,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 912.4,
"min": 418.1666666666667,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 18248.0,
"min": 13464.0,
"max": 28128.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1186.7506137504733,
"min": 1178.8140551504239,
"max": 1212.5374376786385,
"count": 369
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2373.5012275009467,
"min": 2357.6281103008478,
"max": 26354.53280159907,
"count": 369
},
"SoccerTwos.Step.mean": {
"value": 4999264.0,
"min": 9870.0,
"max": 4999264.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999264.0,
"min": 9870.0,
"max": 4999264.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.006986039690673351,
"min": -0.07708675414323807,
"max": 0.014412983320653439,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.07684643566608429,
"min": -1.0792145729064941,
"max": 0.22211667895317078,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.007536457385867834,
"min": -0.0770554170012474,
"max": 0.014517741277813911,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.08290103077888489,
"min": -1.078758955001831,
"max": 0.20037278532981873,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.0787272724238309,
"min": -0.5749111117588149,
"max": 0.34930909221822565,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.8659999966621399,
"min": -10.348400011658669,
"max": 7.684800028800964,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.0787272724238309,
"min": -0.5749111117588149,
"max": 0.34930909221822565,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.8659999966621399,
"min": -10.348400011658669,
"max": 7.684800028800964,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.012644073850970017,
"min": 0.010785335576413976,
"max": 0.023557618101282665,
"count": 232
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.012644073850970017,
"min": 0.010785335576413976,
"max": 0.023557618101282665,
"count": 232
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.0008207118439410503,
"min": 2.665037854399088e-07,
"max": 0.010205822593222062,
"count": 232
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.0008207118439410503,
"min": 2.665037854399088e-07,
"max": 0.010205822593222062,
"count": 232
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.0008186121189889188,
"min": 2.4038172057316843e-07,
"max": 0.010209519354005655,
"count": 232
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.0008186121189889188,
"min": 2.4038172057316843e-07,
"max": 0.010209519354005655,
"count": 232
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 232
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 232
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 232
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 232
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 232
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 232
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1724142155",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/fortminors/miniconda3/envs/rl_course/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.4.0+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1724144955"
},
"total": 2799.289504060056,
"count": 1,
"self": 0.1665385509841144,
"children": {
"run_training.setup": {
"total": 0.008161099161952734,
"count": 1,
"self": 0.008161099161952734
},
"TrainerController.start_learning": {
"total": 2799.11480440991,
"count": 1,
"self": 2.449658378493041,
"children": {
"TrainerController._reset_env": {
"total": 1.62942464184016,
"count": 25,
"self": 1.62942464184016
},
"TrainerController.advance": {
"total": 2794.9648115821183,
"count": 324971,
"self": 2.392891895957291,
"children": {
"env_step": {
"total": 2168.046913651284,
"count": 324971,
"self": 1635.4080960233696,
"children": {
"SubprocessEnvManager._take_step": {
"total": 531.147889896296,
"count": 324971,
"self": 19.13263945421204,
"children": {
"TorchPolicy.evaluate": {
"total": 512.0152504420839,
"count": 645152,
"self": 512.0152504420839
}
}
},
"workers": {
"total": 1.4909277316182852,
"count": 324971,
"self": 0.0,
"children": {
"worker_root": {
"total": 2795.6328543592244,
"count": 324971,
"is_parallel": true,
"self": 1475.3261391385458,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0010009007528424263,
"count": 2,
"is_parallel": true,
"self": 0.00024868594482541084,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0007522148080170155,
"count": 8,
"is_parallel": true,
"self": 0.0007522148080170155
}
}
},
"UnityEnvironment.step": {
"total": 0.011439745780080557,
"count": 1,
"is_parallel": true,
"self": 0.00025154557079076767,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0002005067653954029,
"count": 1,
"is_parallel": true,
"self": 0.0002005067653954029
},
"communicator.exchange": {
"total": 0.01031966507434845,
"count": 1,
"is_parallel": true,
"self": 0.01031966507434845
},
"steps_from_proto": {
"total": 0.0006680283695459366,
"count": 2,
"is_parallel": true,
"self": 0.00013251090422272682,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0005355174653232098,
"count": 8,
"is_parallel": true,
"self": 0.0005355174653232098
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1320.2894980795681,
"count": 324970,
"is_parallel": true,
"self": 75.44282341795042,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 45.88406424270943,
"count": 324970,
"is_parallel": true,
"self": 45.88406424270943
},
"communicator.exchange": {
"total": 998.7209436986595,
"count": 324970,
"is_parallel": true,
"self": 998.7209436986595
},
"steps_from_proto": {
"total": 200.24166672024876,
"count": 649940,
"is_parallel": true,
"self": 35.716151917818934,
"children": {
"_process_rank_one_or_two_observation": {
"total": 164.52551480242983,
"count": 2599760,
"is_parallel": true,
"self": 164.52551480242983
}
}
}
}
},
"steps_from_proto": {
"total": 0.01721714111045003,
"count": 48,
"is_parallel": true,
"self": 0.0032692006789147854,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.013947940431535244,
"count": 192,
"is_parallel": true,
"self": 0.013947940431535244
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 624.5250060348772,
"count": 324971,
"self": 26.96057178778574,
"children": {
"process_trajectory": {
"total": 169.41629069950432,
"count": 324971,
"self": 168.63483696151525,
"children": {
"RLTrainer._checkpoint": {
"total": 0.781453737989068,
"count": 10,
"self": 0.781453737989068
}
}
},
"_update_policy": {
"total": 428.1481435475871,
"count": 232,
"self": 236.68582352017984,
"children": {
"TorchPOCAOptimizer.update": {
"total": 191.46232002740726,
"count": 6963,
"self": 191.46232002740726
}
}
}
}
}
}
},
"trainer_threads": {
"total": 5.052424967288971e-07,
"count": 1,
"self": 5.052424967288971e-07
},
"TrainerController._save_models": {
"total": 0.0709093022160232,
"count": 1,
"self": 0.0007661245763301849,
"children": {
"RLTrainer._checkpoint": {
"total": 0.07014317763969302,
"count": 1,
"self": 0.07014317763969302
}
}
}
}
}
}
}