manuu01 commited on
Commit
1eee028
1 Parent(s): 82cfeb0

Update_agent

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be68a1d27f55cf586f88ee45afa6d916c4f7a2ca602ed6690ea3b25c06d3b7b6
3
  size 886472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15c0b0766c20d8adf80b92670d12210393aa05d57139e2d52f1a2b38ef385cd1
3
  size 886472
SoccerTwos/SoccerTwos-10499932.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a759cf86cc7e33e7faa9d18bf94c54e74bc532e92dcb88cd4b71fed731d3abe5
3
+ size 886472
SoccerTwos/SoccerTwos-10499932.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac432283cff4ae617cdab6301070d89776a272850addfe41d587ae82b8100ca9
3
+ size 10303217
SoccerTwos/SoccerTwos-10999982.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd5c8d24666045c60e620b78790c4e0c31cf02ee9eca4cd907d95c624c2455b1
3
+ size 886472
SoccerTwos/SoccerTwos-10999982.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a63591188c5c4dfa1f9dd0e0cf2a6dfef5ef1e7e4b8b125731ba04e7541cfd7
3
+ size 10303217
SoccerTwos/SoccerTwos-11397816.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15c0b0766c20d8adf80b92670d12210393aa05d57139e2d52f1a2b38ef385cd1
3
+ size 886472
SoccerTwos/SoccerTwos-11397816.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:514bef70703dc8232cd4b3496e2aa862f971df83174690e02a8d585a5e0c6bf1
3
+ size 10303217
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:631c93e41924164b6d4fe209dd7e74520a46159b919af6a137f6a66c94f0778b
3
  size 10303217
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:514bef70703dc8232cd4b3496e2aa862f971df83174690e02a8d585a5e0c6bf1
3
  size 10303217
SoccerTwos/events.out.tfevents.1691328393.51fdecdbc575.29941.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66789dc83a882d79a20de24418ec2592f9811bb9354e76899a36288a60c0134f
3
+ size 1429890
run_logs/Player-0.log CHANGED
@@ -31,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
- - Completed reload, in 0.235 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -56,7 +56,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
- UnloadTime: 7.297608 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
@@ -65,7 +65,7 @@ Memory Statistics:
65
  [ALLOC_TEMP_TLS] TLS Allocator
66
  StackAllocators :
67
  [ALLOC_TEMP_MAIN]
68
- Peak usage frame count: [8.0 KB-16.0 KB]: 26251 frames, [2.0 MB-4.0 MB]: 1 frames
69
  Initial Block Size 4.0 MB
70
  Current Block Size 4.0 MB
71
  Peak Allocated Bytes 2.1 MB
@@ -181,22 +181,22 @@ Memory Statistics:
181
  Peak Allocated Bytes 0 B
182
  Overflow Count 0
183
  [ALLOC_DEFAULT] Dual Thread Allocator
184
- Peak main deferred allocation count 3
185
  [ALLOC_BUCKET]
186
  Large Block size 4.0 MB
187
  Used Block count 1
188
  Peak Allocated bytes 1.0 MB
189
  [ALLOC_DEFAULT_MAIN]
190
- Peak usage frame count: [4.0 MB-8.0 MB]: 26252 frames
191
  Requested Block Size 16.0 MB
192
  Peak Block count 1
193
- Peak Allocated memory 4.6 MB
194
  Peak Large allocation bytes 0 B
195
  [ALLOC_DEFAULT_THREAD]
196
- Peak usage frame count: [16.0 MB-32.0 MB]: 26252 frames
197
  Requested Block Size 16.0 MB
198
  Peak Block count 1
199
- Peak Allocated memory 17.6 MB
200
  Peak Large allocation bytes 16.0 MB
201
  [ALLOC_TEMP_JOB_1_FRAME]
202
  Initial Block Size 2.0 MB
@@ -225,13 +225,13 @@ Memory Statistics:
225
  Used Block count 1
226
  Peak Allocated bytes 1.0 MB
227
  [ALLOC_GFX_MAIN]
228
- Peak usage frame count: [32.0 KB-64.0 KB]: 26251 frames, [64.0 KB-128.0 KB]: 1 frames
229
  Requested Block Size 16.0 MB
230
  Peak Block count 1
231
  Peak Allocated memory 65.6 KB
232
  Peak Large allocation bytes 0 B
233
  [ALLOC_GFX_THREAD]
234
- Peak usage frame count: [128.0 KB-256.0 KB]: 26252 frames
235
  Requested Block Size 16.0 MB
236
  Peak Block count 1
237
  Peak Allocated memory 173.5 KB
@@ -243,16 +243,16 @@ Memory Statistics:
243
  Used Block count 1
244
  Peak Allocated bytes 1.0 MB
245
  [ALLOC_CACHEOBJECTS_MAIN]
246
- Peak usage frame count: [0.5 MB-1.0 MB]: 26252 frames
247
  Requested Block Size 4.0 MB
248
  Peak Block count 1
249
  Peak Allocated memory 0.6 MB
250
  Peak Large allocation bytes 0 B
251
  [ALLOC_CACHEOBJECTS_THREAD]
252
- Peak usage frame count: [0.5 MB-1.0 MB]: 26251 frames, [4.0 MB-8.0 MB]: 1 frames
253
  Requested Block Size 4.0 MB
254
  Peak Block count 2
255
- Peak Allocated memory 4.4 MB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_TYPETREE] Dual Thread Allocator
258
  Peak main deferred allocation count 0
@@ -261,13 +261,13 @@ Memory Statistics:
261
  Used Block count 1
262
  Peak Allocated bytes 1.0 MB
263
  [ALLOC_TYPETREE_MAIN]
264
- Peak usage frame count: [0-1.0 KB]: 26252 frames
265
  Requested Block Size 2.0 MB
266
  Peak Block count 1
267
  Peak Allocated memory 1.0 KB
268
  Peak Large allocation bytes 0 B
269
  [ALLOC_TYPETREE_THREAD]
270
- Peak usage frame count: [1.0 KB-2.0 KB]: 26251 frames, [2.0 KB-4.0 KB]: 1 frames
271
  Requested Block Size 2.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 2.2 KB
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.135 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
+ UnloadTime: 1.127789 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
 
65
  [ALLOC_TEMP_TLS] TLS Allocator
66
  StackAllocators :
67
  [ALLOC_TEMP_MAIN]
68
+ Peak usage frame count: [8.0 KB-16.0 KB]: 26275 frames, [2.0 MB-4.0 MB]: 1 frames
69
  Initial Block Size 4.0 MB
70
  Current Block Size 4.0 MB
71
  Peak Allocated Bytes 2.1 MB
 
181
  Peak Allocated Bytes 0 B
182
  Overflow Count 0
183
  [ALLOC_DEFAULT] Dual Thread Allocator
184
+ Peak main deferred allocation count 4
185
  [ALLOC_BUCKET]
186
  Large Block size 4.0 MB
187
  Used Block count 1
188
  Peak Allocated bytes 1.0 MB
189
  [ALLOC_DEFAULT_MAIN]
190
+ Peak usage frame count: [4.0 MB-8.0 MB]: 26276 frames
191
  Requested Block Size 16.0 MB
192
  Peak Block count 1
193
+ Peak Allocated memory 5.2 MB
194
  Peak Large allocation bytes 0 B
195
  [ALLOC_DEFAULT_THREAD]
196
+ Peak usage frame count: [16.0 MB-32.0 MB]: 26276 frames
197
  Requested Block Size 16.0 MB
198
  Peak Block count 1
199
+ Peak Allocated memory 17.0 MB
200
  Peak Large allocation bytes 16.0 MB
201
  [ALLOC_TEMP_JOB_1_FRAME]
202
  Initial Block Size 2.0 MB
 
225
  Used Block count 1
226
  Peak Allocated bytes 1.0 MB
227
  [ALLOC_GFX_MAIN]
228
+ Peak usage frame count: [32.0 KB-64.0 KB]: 26275 frames, [64.0 KB-128.0 KB]: 1 frames
229
  Requested Block Size 16.0 MB
230
  Peak Block count 1
231
  Peak Allocated memory 65.6 KB
232
  Peak Large allocation bytes 0 B
233
  [ALLOC_GFX_THREAD]
234
+ Peak usage frame count: [128.0 KB-256.0 KB]: 26276 frames
235
  Requested Block Size 16.0 MB
236
  Peak Block count 1
237
  Peak Allocated memory 173.5 KB
 
243
  Used Block count 1
244
  Peak Allocated bytes 1.0 MB
245
  [ALLOC_CACHEOBJECTS_MAIN]
246
+ Peak usage frame count: [0.5 MB-1.0 MB]: 26276 frames
247
  Requested Block Size 4.0 MB
248
  Peak Block count 1
249
  Peak Allocated memory 0.6 MB
250
  Peak Large allocation bytes 0 B
251
  [ALLOC_CACHEOBJECTS_THREAD]
252
+ Peak usage frame count: [0.5 MB-1.0 MB]: 26275 frames, [2.0 MB-4.0 MB]: 1 frames
253
  Requested Block Size 4.0 MB
254
  Peak Block count 2
255
+ Peak Allocated memory 4.0 MB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_TYPETREE] Dual Thread Allocator
258
  Peak main deferred allocation count 0
 
261
  Used Block count 1
262
  Peak Allocated bytes 1.0 MB
263
  [ALLOC_TYPETREE_MAIN]
264
+ Peak usage frame count: [0-1.0 KB]: 26276 frames
265
  Requested Block Size 2.0 MB
266
  Peak Block count 1
267
  Peak Allocated memory 1.0 KB
268
  Peak Large allocation bytes 0 B
269
  [ALLOC_TYPETREE_THREAD]
270
+ Peak usage frame count: [1.0 KB-2.0 KB]: 26275 frames, [2.0 KB-4.0 KB]: 1 frames
271
  Requested Block Size 2.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,75 +2,87 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 2.0817551612854004,
6
- "min": 2.050828218460083,
7
- "max": 2.275116205215454,
8
- "count": 139
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 42900.8125,
12
- "min": 39650.84375,
13
- "max": 50390.9765625,
14
- "count": 139
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 39.314516129032256,
18
- "min": 33.28082191780822,
19
- "max": 57.25581395348837,
20
- "count": 139
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19500.0,
24
- "min": 16104.0,
25
- "max": 20308.0,
26
- "count": 139
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1514.2101837328041,
30
- "min": 1476.4009957931617,
31
- "max": 1527.4014633986794,
32
- "count": 139
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 375524.12556573545,
36
- "min": 256817.66796581444,
37
- "max": 441113.2119379982,
38
- "count": 139
 
 
 
 
 
 
 
 
 
 
 
 
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 10339990.0,
42
- "min": 8959951.0,
43
- "max": 10339990.0,
44
  "count": 139
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 10339990.0,
48
- "min": 8959951.0,
49
- "max": 10339990.0,
50
  "count": 139
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.01461908221244812,
54
- "min": -0.04508669674396515,
55
- "max": 0.06564339250326157,
56
  "count": 139
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 3.6109132766723633,
60
- "min": -9.310239791870117,
61
- "max": 16.082632064819336,
62
  "count": 139
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.015170346014201641,
66
- "min": -0.04868944361805916,
67
- "max": 0.06690935045480728,
68
  "count": 139
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 3.7470755577087402,
72
- "min": -9.785125732421875,
73
- "max": 16.198457717895508,
74
  "count": 139
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
@@ -86,75 +98,63 @@
86
  "count": 139
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": 0.014383805908172237,
90
- "min": -0.1816229159012437,
91
- "max": 0.21367312527963245,
92
  "count": 139
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": 3.5528000593185425,
96
- "min": -36.445600390434265,
97
- "max": 48.50379943847656,
98
  "count": 139
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": 0.014383805908172237,
102
- "min": -0.1816229159012437,
103
- "max": 0.21367312527963245,
104
  "count": 139
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": 3.5528000593185425,
108
- "min": -36.445600390434265,
109
- "max": 48.50379943847656,
110
- "count": 139
111
- },
112
- "SoccerTwos.IsTraining.mean": {
113
- "value": 1.0,
114
- "min": 1.0,
115
- "max": 1.0,
116
- "count": 139
117
- },
118
- "SoccerTwos.IsTraining.sum": {
119
- "value": 1.0,
120
- "min": 1.0,
121
- "max": 1.0,
122
  "count": 139
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.014852080177903796,
126
- "min": 0.009855266399487543,
127
- "max": 0.022194832651378723,
128
  "count": 67
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.014852080177903796,
132
- "min": 0.009855266399487543,
133
- "max": 0.022194832651378723,
134
  "count": 67
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.08246669918298721,
138
- "min": 0.07240680480996768,
139
- "max": 0.0872135025759538,
140
  "count": 67
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.08246669918298721,
144
- "min": 0.07240680480996768,
145
- "max": 0.0872135025759538,
146
  "count": 67
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.08406391814351082,
150
- "min": 0.07332472875714302,
151
- "max": 0.08962557539343834,
152
  "count": 67
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.08406391814351082,
156
- "min": 0.07332472875714302,
157
- "max": 0.08962557539343834,
158
  "count": 67
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
@@ -196,7 +196,7 @@
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1691323071",
200
  "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
201
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume --torch-device=cpu",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,59 +204,59 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0+cu102",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1691328379"
208
  },
209
- "total": 5307.499628232,
210
  "count": 1,
211
- "self": 0.5378562470004908,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.06018139100001463,
215
  "count": 1,
216
- "self": 0.06018139100001463
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 5306.901590594,
220
  "count": 1,
221
- "self": 3.954543449065568,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 1.757532165000839,
225
  "count": 8,
226
- "self": 1.757532165000839
227
  },
228
  "TrainerController.advance": {
229
- "total": 5301.185609296934,
230
- "count": 99781,
231
- "self": 4.008114537936308,
232
  "children": {
233
  "env_step": {
234
- "total": 2931.331986786951,
235
- "count": 99781,
236
- "self": 2508.7911618191483,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 420.3306268819065,
240
- "count": 99781,
241
- "self": 18.73769292570705,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 401.59293395619943,
245
- "count": 175010,
246
- "self": 401.59293395619943
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 2.2101980858960815,
252
- "count": 99780,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 5284.2023605070735,
257
- "count": 99780,
258
  "is_parallel": true,
259
- "self": 3188.8961787200533,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +265,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.004170569000052637,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.0011218869999538583,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.003048682000098779,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.003048682000098779
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.04688210699987394,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.0013496169997324614,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.0006175339999572316,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.0006175339999572316
292
  },
293
  "communicator.exchange": {
294
- "total": 0.040462964000198554,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.040462964000198554
298
  },
299
  "steps_from_proto": {
300
- "total": 0.004451991999985694,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.0008053609999478795,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.0036466310000378144,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.0036466310000378144
310
  }
311
  }
312
  }
@@ -315,48 +315,48 @@
315
  }
316
  },
317
  "steps_from_proto": {
318
- "total": 0.019279038001741355,
319
  "count": 14,
320
  "is_parallel": true,
321
- "self": 0.0034742869997899106,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
- "total": 0.015804751001951445,
325
  "count": 56,
326
  "is_parallel": true,
327
- "self": 0.015804751001951445
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
- "total": 2095.2869027490187,
333
- "count": 99779,
334
  "is_parallel": true,
335
- "self": 125.02009742788687,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
- "total": 64.16027218404838,
339
- "count": 99779,
340
  "is_parallel": true,
341
- "self": 64.16027218404838
342
  },
343
  "communicator.exchange": {
344
- "total": 1498.7004830649933,
345
- "count": 99779,
346
  "is_parallel": true,
347
- "self": 1498.7004830649933
348
  },
349
  "steps_from_proto": {
350
- "total": 407.40605007209024,
351
- "count": 199558,
352
  "is_parallel": true,
353
- "self": 72.04748076905344,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
- "total": 335.3585693030368,
357
- "count": 798232,
358
  "is_parallel": true,
359
- "self": 335.3585693030368
360
  }
361
  }
362
  }
@@ -369,31 +369,31 @@
369
  }
370
  },
371
  "trainer_advance": {
372
- "total": 2365.8455079720466,
373
- "count": 99780,
374
- "self": 25.670958199969846,
375
  "children": {
376
  "process_trajectory": {
377
- "total": 507.6338691290741,
378
- "count": 99780,
379
- "self": 506.59619934807483,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
- "total": 1.0376697809992947,
383
  "count": 3,
384
- "self": 1.0376697809992947
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
- "total": 1832.5406806430028,
390
- "count": 67,
391
- "self": 356.4519601630159,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
- "total": 1476.088720479987,
395
- "count": 2010,
396
- "self": 1476.088720479987
397
  }
398
  }
399
  }
@@ -402,19 +402,19 @@
402
  }
403
  },
404
  "trainer_threads": {
405
- "total": 1.538999640615657e-06,
406
  "count": 1,
407
- "self": 1.538999640615657e-06
408
  },
409
  "TrainerController._save_models": {
410
- "total": 0.0039041439995344263,
411
  "count": 1,
412
- "self": 6.911199943715474e-05,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
- "total": 0.0038350320000972715,
416
  "count": 1,
417
- "self": 0.0038350320000972715
418
  }
419
  }
420
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 2.064077615737915,
6
+ "min": 1.9721202850341797,
7
+ "max": 2.2204861640930176,
8
+ "count": 140
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 40554.99609375,
12
+ "min": 1009.7255859375,
13
+ "max": 46868.6640625,
14
+ "count": 140
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 42.35964912280702,
18
+ "min": 14.0,
19
+ "max": 50.28865979381443,
20
+ "count": 140
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19316.0,
24
+ "min": 56.0,
25
+ "max": 20672.0,
26
+ "count": 140
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1495.341597534808,
30
+ "min": 1479.5228480829521,
31
+ "max": 1555.2513011464291,
32
+ "count": 140
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 340937.88423793623,
36
+ "min": 3019.393197996907,
37
+ "max": 406628.1923216918,
38
+ "count": 140
39
+ },
40
+ "SoccerTwos.IsTraining.mean": {
41
+ "value": 1.0,
42
+ "min": 1.0,
43
+ "max": 1.0,
44
+ "count": 140
45
+ },
46
+ "SoccerTwos.IsTraining.sum": {
47
+ "value": 1.0,
48
+ "min": 1.0,
49
+ "max": 1.0,
50
+ "count": 140
51
  },
52
  "SoccerTwos.Step.mean": {
53
+ "value": 11389982.0,
54
+ "min": 10009986.0,
55
+ "max": 11389982.0,
56
  "count": 139
57
  },
58
  "SoccerTwos.Step.sum": {
59
+ "value": 11389982.0,
60
+ "min": 10009986.0,
61
+ "max": 11389982.0,
62
  "count": 139
63
  },
64
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
65
+ "value": 0.018466472625732422,
66
+ "min": -0.0826631560921669,
67
+ "max": 0.08379679918289185,
68
  "count": 139
69
  },
70
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
71
+ "value": 4.210355758666992,
72
+ "min": -19.01252555847168,
73
+ "max": 18.016311645507812,
74
  "count": 139
75
  },
76
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
77
+ "value": 0.022079264745116234,
78
+ "min": -0.08283711969852448,
79
+ "max": 0.08470716327428818,
80
  "count": 139
81
  },
82
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
83
+ "value": 5.034072399139404,
84
+ "min": -19.05253791809082,
85
+ "max": 18.212039947509766,
86
  "count": 139
87
  },
88
  "SoccerTwos.Environment.CumulativeReward.mean": {
 
98
  "count": 139
99
  },
100
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
101
+ "value": 0.013108772666830765,
102
+ "min": -0.29112212425839584,
103
+ "max": 0.30266069535592305,
104
  "count": 139
105
  },
106
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
107
+ "value": 2.9888001680374146,
108
+ "min": -65.79360008239746,
109
+ "max": 60.83479976654053,
110
  "count": 139
111
  },
112
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
113
+ "value": 0.013108772666830765,
114
+ "min": -0.29112212425839584,
115
+ "max": 0.30266069535592305,
116
  "count": 139
117
  },
118
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
119
+ "value": 2.9888001680374146,
120
+ "min": -65.79360008239746,
121
+ "max": 60.83479976654053,
 
 
 
 
 
 
 
 
 
 
 
 
122
  "count": 139
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.019926921123017867,
126
+ "min": 0.008833187571144662,
127
+ "max": 0.021963592153042555,
128
  "count": 67
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.019926921123017867,
132
+ "min": 0.008833187571144662,
133
+ "max": 0.021963592153042555,
134
  "count": 67
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.08703152487675349,
138
+ "min": 0.07363507027427356,
139
+ "max": 0.09096993108590444,
140
  "count": 67
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.08703152487675349,
144
+ "min": 0.07363507027427356,
145
+ "max": 0.09096993108590444,
146
  "count": 67
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.08892411440610885,
150
+ "min": 0.07475643530488014,
151
+ "max": 0.09255644927422206,
152
  "count": 67
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.08892411440610885,
156
+ "min": 0.07475643530488014,
157
+ "max": 0.09255644927422206,
158
  "count": 67
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
 
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1691328390",
200
  "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
201
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume --torch-device=cpu",
202
  "mlagents_version": "0.31.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0+cu102",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1691333783"
208
  },
209
+ "total": 5393.545187022,
210
  "count": 1,
211
+ "self": 0.011667517999740085,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.07663645400043606,
215
  "count": 1,
216
+ "self": 0.07663645400043606
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 5393.45688305,
220
  "count": 1,
221
+ "self": 4.0113200330524705,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 4.206497418999788,
225
  "count": 8,
226
+ "self": 4.206497418999788
227
  },
228
  "TrainerController.advance": {
229
+ "total": 5384.80390978495,
230
+ "count": 100295,
231
+ "self": 4.056981303214343,
232
  "children": {
233
  "env_step": {
234
+ "total": 2984.7628137827132,
235
+ "count": 100295,
236
+ "self": 2555.438939750102,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 426.984713441444,
240
+ "count": 100295,
241
+ "self": 18.920596326604027,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 408.06411711484,
245
+ "count": 175170,
246
+ "self": 408.06411711484
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 2.339160591167456,
252
+ "count": 100295,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 5364.331135505195,
257
+ "count": 100295,
258
  "is_parallel": true,
259
+ "self": 3235.772959452249,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
 
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
+ "total": 0.026826493000044138,
269
  "count": 2,
270
  "is_parallel": true,
271
+ "self": 0.011697553999511001,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
+ "total": 0.015128939000533137,
275
  "count": 8,
276
  "is_parallel": true,
277
+ "self": 0.015128939000533137
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
+ "total": 0.12830688400026702,
283
  "count": 1,
284
  "is_parallel": true,
285
+ "self": 0.00149898600011511,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
+ "total": 0.0009528390000923537,
289
  "count": 1,
290
  "is_parallel": true,
291
+ "self": 0.0009528390000923537
292
  },
293
  "communicator.exchange": {
294
+ "total": 0.12143531600031565,
295
  "count": 1,
296
  "is_parallel": true,
297
+ "self": 0.12143531600031565
298
  },
299
  "steps_from_proto": {
300
+ "total": 0.004419742999743903,
301
  "count": 2,
302
  "is_parallel": true,
303
+ "self": 0.000816295999356953,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
+ "total": 0.00360344700038695,
307
  "count": 8,
308
  "is_parallel": true,
309
+ "self": 0.00360344700038695
310
  }
311
  }
312
  }
 
315
  }
316
  },
317
  "steps_from_proto": {
318
+ "total": 0.031148086000939657,
319
  "count": 14,
320
  "is_parallel": true,
321
+ "self": 0.009768344001713558,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
+ "total": 0.0213797419992261,
325
  "count": 56,
326
  "is_parallel": true,
327
+ "self": 0.0213797419992261
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
+ "total": 2128.527027966945,
333
+ "count": 100294,
334
  "is_parallel": true,
335
+ "self": 125.7653667474824,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
+ "total": 66.86405879619542,
339
+ "count": 100294,
340
  "is_parallel": true,
341
+ "self": 66.86405879619542
342
  },
343
  "communicator.exchange": {
344
+ "total": 1523.5743622309183,
345
+ "count": 100294,
346
  "is_parallel": true,
347
+ "self": 1523.5743622309183
348
  },
349
  "steps_from_proto": {
350
+ "total": 412.32324019234875,
351
+ "count": 200588,
352
  "is_parallel": true,
353
+ "self": 73.06807255982676,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
+ "total": 339.255167632522,
357
+ "count": 802352,
358
  "is_parallel": true,
359
+ "self": 339.255167632522
360
  }
361
  }
362
  }
 
369
  }
370
  },
371
  "trainer_advance": {
372
+ "total": 2395.984114699022,
373
+ "count": 100295,
374
+ "self": 25.40969510305149,
375
  "children": {
376
  "process_trajectory": {
377
+ "total": 516.8834398569752,
378
+ "count": 100295,
379
+ "self": 515.9829564609745,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
+ "total": 0.900483396000709,
383
  "count": 3,
384
+ "self": 0.900483396000709
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
+ "total": 1853.6909797389953,
390
+ "count": 68,
391
+ "self": 352.6695557349776,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
+ "total": 1501.0214240040177,
395
+ "count": 2017,
396
+ "self": 1501.0214240040177
397
  }
398
  }
399
  }
 
402
  }
403
  },
404
  "trainer_threads": {
405
+ "total": 1.9689996406668797e-06,
406
  "count": 1,
407
+ "self": 1.9689996406668797e-06
408
  },
409
  "TrainerController._save_models": {
410
+ "total": 0.43515384399870527,
411
  "count": 1,
412
+ "self": 0.0031298809990403242,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
+ "total": 0.43202396299966495,
416
  "count": 1,
417
+ "self": 0.43202396299966495
418
  }
419
  }
420
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 8500054,
6
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-8500054.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1690985799.4838839,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos/SoccerTwos/SoccerTwos-8500054.pt"
11
  ]
12
  },
13
  {
14
- "steps": 8951810,
15
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-8951810.onnx",
16
- "reward": 0.0,
17
- "creation_time": 1691323056.1832547,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos/SoccerTwos/SoccerTwos-8951810.pt"
20
  ]
21
  },
22
  {
23
- "steps": 8999993,
24
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-8999993.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1691323250.2108784,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos/SoccerTwos/SoccerTwos-8999993.pt"
29
  ]
30
  },
31
  {
32
- "steps": 9499966,
33
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-9499966.onnx",
34
  "reward": 0.0,
35
- "creation_time": 1691325176.6160336,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos/SoccerTwos/SoccerTwos-9499966.pt"
38
  ]
39
  },
40
  {
41
- "steps": 9999992,
42
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.onnx",
43
- "reward": 0.0,
44
- "creation_time": 1691327051.966959,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1508.9473185543081,
51
  "final_checkpoint": {
52
- "steps": 8951810,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
- "reward": 0.0,
55
- "creation_time": 1691323056.1832547,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos/SoccerTwos/SoccerTwos-8951810.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 9999992,
6
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1691327051.966959,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 9999992,
15
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.onnx",
16
+ "reward": null,
17
+ "creation_time": 1691328396.2647002,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-9999992.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 10499932,
24
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-10499932.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1691330319.251756,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-10499932.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 10999982,
33
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-10999982.onnx",
34
  "reward": 0.0,
35
+ "creation_time": 1691332245.249486,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-10999982.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 11397816,
42
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-11397816.onnx",
43
+ "reward": null,
44
+ "creation_time": 1691333783.8306155,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-11397816.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1500.167190622134,
51
  "final_checkpoint": {
52
+ "steps": 11397816,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
+ "reward": null,
55
+ "creation_time": 1691333783.8306155,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-11397816.pt"
58
  ]
59
  }
60
  },