poca-SoccerTwos / run_logs /timers.json
guocheng66's picture
Second Push
8a152f0
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.1824750900268555,
"min": 3.1547484397888184,
"max": 3.2956900596618652,
"count": 100
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 88701.9453125,
"min": 23412.0703125,
"max": 114764.3203125,
"count": 100
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 860.5,
"min": 489.9,
"max": 999.0,
"count": 100
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 20652.0,
"min": 14644.0,
"max": 27616.0,
"count": 100
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1200.78991806887,
"min": 1197.0440605645447,
"max": 1207.1172065682176,
"count": 90
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 4803.15967227548,
"min": 2394.0881211290894,
"max": 16784.708841766012,
"count": 90
},
"SoccerTwos.Step.mean": {
"value": 999684.0,
"min": 9824.0,
"max": 999684.0,
"count": 100
},
"SoccerTwos.Step.sum": {
"value": 999684.0,
"min": 9824.0,
"max": 999684.0,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.00797598622739315,
"min": -0.036553021520376205,
"max": 0.05947311595082283,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.0957118347287178,
"min": -0.438421368598938,
"max": 0.8325973749160767,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.006179752293974161,
"min": -0.022581540048122406,
"max": 0.05948488041758537,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.07415702939033508,
"min": -0.27457916736602783,
"max": 0.8327765464782715,
"count": 100
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 100
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.16666666666666666,
"min": -0.5860000000550196,
"max": 0.38087058768552895,
"count": 100
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -2.0,
"min": -8.0,
"max": 6.474799990653992,
"count": 100
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.16666666666666666,
"min": -0.5860000000550196,
"max": 0.38087058768552895,
"count": 100
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -2.0,
"min": -8.0,
"max": 6.474799990653992,
"count": 100
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.012221555140179892,
"min": 0.006795583742981156,
"max": 0.016645218633736174,
"count": 46
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.012221555140179892,
"min": 0.006795583742981156,
"max": 0.016645218633736174,
"count": 46
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.003237667710830768,
"min": 8.194062053613985e-05,
"max": 0.01861500459102293,
"count": 46
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.003237667710830768,
"min": 8.194062053613985e-05,
"max": 0.01861500459102293,
"count": 46
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.00324154964958628,
"min": 7.848465102142655e-05,
"max": 0.009435744381820162,
"count": 46
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.00324154964958628,
"min": 7.848465102142655e-05,
"max": 0.009435744381820162,
"count": 46
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0006,
"min": 0.0006,
"max": 0.0006,
"count": 46
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0006,
"min": 0.0006,
"max": 0.0006,
"count": 46
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 46
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 46
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005,
"min": 0.005,
"max": 0.005,
"count": 46
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005,
"min": 0.005,
"max": 0.005,
"count": 46
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1697686348",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.0.1+cu118",
"numpy_version": "1.23.5",
"end_time_seconds": "1697688565"
},
"total": 2217.164994551,
"count": 1,
"self": 0.4259129499996561,
"children": {
"run_training.setup": {
"total": 0.07464664500002982,
"count": 1,
"self": 0.07464664500002982
},
"TrainerController.start_learning": {
"total": 2216.664434956,
"count": 1,
"self": 1.6753877999994984,
"children": {
"TrainerController._reset_env": {
"total": 4.416130657000224,
"count": 5,
"self": 4.416130657000224
},
"TrainerController.advance": {
"total": 2210.3573846880004,
"count": 65069,
"self": 1.8022751490188966,
"children": {
"env_step": {
"total": 1823.0047769609614,
"count": 65069,
"self": 1406.1171325439245,
"children": {
"SubprocessEnvManager._take_step": {
"total": 415.8875872410355,
"count": 65069,
"self": 11.887741108043144,
"children": {
"TorchPolicy.evaluate": {
"total": 403.99984613299233,
"count": 129182,
"self": 403.99984613299233
}
}
},
"workers": {
"total": 1.0000571760013486,
"count": 65069,
"self": 0.0,
"children": {
"worker_root": {
"total": 2212.1702933349934,
"count": 65069,
"is_parallel": true,
"self": 1033.889048864969,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0044236590000537035,
"count": 2,
"is_parallel": true,
"self": 0.0009960950001186575,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.003427563999935046,
"count": 8,
"is_parallel": true,
"self": 0.003427563999935046
}
}
},
"UnityEnvironment.step": {
"total": 0.0418704440000397,
"count": 1,
"is_parallel": true,
"self": 0.0012168680000286258,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0008716350000099737,
"count": 1,
"is_parallel": true,
"self": 0.0008716350000099737
},
"communicator.exchange": {
"total": 0.035724202000039895,
"count": 1,
"is_parallel": true,
"self": 0.035724202000039895
},
"steps_from_proto": {
"total": 0.004057738999961202,
"count": 2,
"is_parallel": true,
"self": 0.0006634809998899982,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.003394258000071204,
"count": 8,
"is_parallel": true,
"self": 0.003394258000071204
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1178.2684012030245,
"count": 65068,
"is_parallel": true,
"self": 75.30102161908849,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 49.89441047398384,
"count": 65068,
"is_parallel": true,
"self": 49.89441047398384
},
"communicator.exchange": {
"total": 818.6866904860156,
"count": 65068,
"is_parallel": true,
"self": 818.6866904860156
},
"steps_from_proto": {
"total": 234.38627862393668,
"count": 130136,
"is_parallel": true,
"self": 37.99782386399312,
"children": {
"_process_rank_one_or_two_observation": {
"total": 196.38845475994356,
"count": 520544,
"is_parallel": true,
"self": 196.38845475994356
}
}
}
}
},
"steps_from_proto": {
"total": 0.012843266999880143,
"count": 8,
"is_parallel": true,
"self": 0.002305757999351954,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.010537509000528189,
"count": 32,
"is_parallel": true,
"self": 0.010537509000528189
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 385.55033257802,
"count": 65069,
"self": 14.281712731008213,
"children": {
"process_trajectory": {
"total": 109.3654763670126,
"count": 65069,
"self": 108.84511364601275,
"children": {
"RLTrainer._checkpoint": {
"total": 0.5203627209998558,
"count": 2,
"self": 0.5203627209998558
}
}
},
"_update_policy": {
"total": 261.9031434799992,
"count": 46,
"self": 161.58336632699843,
"children": {
"TorchPOCAOptimizer.update": {
"total": 100.31977715300076,
"count": 690,
"self": 100.31977715300076
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0740000107034575e-06,
"count": 1,
"self": 1.0740000107034575e-06
},
"TrainerController._save_models": {
"total": 0.2155307369998809,
"count": 1,
"self": 0.001797785000235308,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2137329519996456,
"count": 1,
"self": 0.2137329519996456
}
}
}
}
}
}
}