nlamot commited on
Commit
5c58095
1 Parent(s): a39b693

5M steps, increased learning rate with linear scheduler

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a927605bab3756880322ffbd82591e17b9bb154c4fdfc7aa53dec2b81fee87f6
3
  size 1768747
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8171b9f22f3de0dfac49f68c4df948d5cda20dc11b6a2d73b5e244d153896472
3
  size 1768747
SoccerTwos/SoccerTwos-3499990.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53f40873d5390b4f523c95fc167e4b6e1cef2c2d6e19be275f7f026ba0ae53be
3
+ size 1768747
SoccerTwos/SoccerTwos-3499990.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53624c57bd7bd02e1b93d99843f9ab552bd414561ad8bde5506456b170726264
3
+ size 28430358
SoccerTwos/SoccerTwos-3999988.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ee7944532872486f1b57c530c1c53e1c20fe5ad038b7e57d0825b24f0d3f030
3
+ size 1768747
SoccerTwos/SoccerTwos-3999988.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898d2e3151f633fc67f4a768874fac685fbf912ba93e0f1bb7dba1a48b292994
3
+ size 28430358
SoccerTwos/SoccerTwos-4499985.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a069f767798732937b0ef8a83ee0455b175fe805b479fece70ece051a56a8746
3
+ size 1768747
SoccerTwos/SoccerTwos-4499985.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5bfc75a2b680e1048d6fb76b860c5faad46dd965cde640a14b3bd61badc0dee
3
+ size 28430358
SoccerTwos/SoccerTwos-4999972.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8171b9f22f3de0dfac49f68c4df948d5cda20dc11b6a2d73b5e244d153896472
3
+ size 1768747
SoccerTwos/SoccerTwos-4999972.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9baa0ff638555050fea9bd46515cf5d23335f5f978bb7d4403a56726907844
3
+ size 28430358
SoccerTwos/SoccerTwos-5000376.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8171b9f22f3de0dfac49f68c4df948d5cda20dc11b6a2d73b5e244d153896472
3
+ size 1768747
SoccerTwos/SoccerTwos-5000376.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32c3920c0b57d2ed7866fd28964c598624be7d4afd1fdc3e5019d8310c1bb00b
3
+ size 28430358
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e9770185d2047554a219e6bc1797189e286d95b1f64eebe9cecf9b2ce127d76
3
  size 28429366
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:722fe59ebe4db88e2dd4d2191dfc0ba389035dbf97e91c45a728de4768562749
3
  size 28429366
SoccerTwos/events.out.tfevents.1703848765.nilss-mbp.lan.62191.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:957cee33c212d35c435af44dedc2e16d5b6c65963df108e63c326080cf90a00a
3
+ size 4771353
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0005, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 50000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 250000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos.app", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0005, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 5000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 250000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos.app", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 50000000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 5000000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
run_logs/Player-0.log CHANGED
@@ -10,7 +10,7 @@ NullGfxDevice:
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
- - Completed reload, in 0.033 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -35,7 +35,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
- UnloadTime: 0.190958 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
  TOO LONG
@@ -290,13 +290,259 @@ TOO LONG
290
  TOO LONG
291
  TOO LONG
292
  TOO LONG
293
- Thread 0x16f507000 may have been prematurely finalized
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
294
  Setting up 6 worker threads for Enlighten.
295
  Memory Statistics:
296
  [ALLOC_TEMP_TLS] TLS Allocator
297
  StackAllocators :
298
  [ALLOC_TEMP_MAIN]
299
- Peak usage frame count: [8.0 KB-16.0 KB]: 327785 frames, [2.0 MB-4.0 MB]: 1 frames
300
  Initial Block Size 4.0 MB
301
  Current Block Size 4.0 MB
302
  Peak Allocated Bytes 2.1 MB
@@ -359,7 +605,7 @@ Memory Statistics:
359
  [ALLOC_TEMP_Job.Worker 3]
360
  Initial Block Size 256.0 KB
361
  Current Block Size 256.0 KB
362
- Peak Allocated Bytes 0 B
363
  Overflow Count 0
364
  [ALLOC_TEMP_Background Job.Worker 12]
365
  Initial Block Size 32.0 KB
@@ -414,7 +660,7 @@ Memory Statistics:
414
  [ALLOC_TEMP_Job.Worker 8]
415
  Initial Block Size 256.0 KB
416
  Current Block Size 256.0 KB
417
- Peak Allocated Bytes 0.7 KB
418
  Overflow Count 0
419
  [ALLOC_TEMP_OSX HID Input]
420
  Initial Block Size 64.0 KB
@@ -467,22 +713,22 @@ Memory Statistics:
467
  Peak Allocated Bytes 0 B
468
  Overflow Count 0
469
  [ALLOC_DEFAULT] Dual Thread Allocator
470
- Peak main deferred allocation count 5
471
  [ALLOC_BUCKET]
472
  Large Block size 4.0 MB
473
  Used Block count 1
474
  Peak Allocated bytes 1.0 MB
475
  [ALLOC_DEFAULT_MAIN]
476
- Peak usage frame count: [4.0 MB-8.0 MB]: 327786 frames
477
  Requested Block Size 16.0 MB
478
  Peak Block count 1
479
- Peak Allocated memory 5.2 MB
480
  Peak Large allocation bytes 0 B
481
  [ALLOC_DEFAULT_THREAD]
482
- Peak usage frame count: [16.0 MB-32.0 MB]: 327786 frames
483
  Requested Block Size 16.0 MB
484
  Peak Block count 1
485
- Peak Allocated memory 17.2 MB
486
  Peak Large allocation bytes 16.0 MB
487
  [ALLOC_TEMP_JOB_1_FRAME]
488
  Initial Block Size 2.0 MB
@@ -511,13 +757,13 @@ Memory Statistics:
511
  Used Block count 1
512
  Peak Allocated bytes 1.0 MB
513
  [ALLOC_GFX_MAIN]
514
- Peak usage frame count: [32.0 KB-64.0 KB]: 327785 frames, [64.0 KB-128.0 KB]: 1 frames
515
  Requested Block Size 16.0 MB
516
  Peak Block count 1
517
  Peak Allocated memory 65.6 KB
518
  Peak Large allocation bytes 0 B
519
  [ALLOC_GFX_THREAD]
520
- Peak usage frame count: [128.0 KB-256.0 KB]: 327786 frames
521
  Requested Block Size 16.0 MB
522
  Peak Block count 1
523
  Peak Allocated memory 173.5 KB
@@ -529,13 +775,13 @@ Memory Statistics:
529
  Used Block count 1
530
  Peak Allocated bytes 1.0 MB
531
  [ALLOC_CACHEOBJECTS_MAIN]
532
- Peak usage frame count: [0.5 MB-1.0 MB]: 327786 frames
533
  Requested Block Size 4.0 MB
534
  Peak Block count 1
535
  Peak Allocated memory 0.6 MB
536
  Peak Large allocation bytes 0 B
537
  [ALLOC_CACHEOBJECTS_THREAD]
538
- Peak usage frame count: [0.5 MB-1.0 MB]: 327785 frames, [2.0 MB-4.0 MB]: 1 frames
539
  Requested Block Size 4.0 MB
540
  Peak Block count 1
541
  Peak Allocated memory 3.4 MB
@@ -547,13 +793,13 @@ Memory Statistics:
547
  Used Block count 1
548
  Peak Allocated bytes 1.0 MB
549
  [ALLOC_TYPETREE_MAIN]
550
- Peak usage frame count: [0-1.0 KB]: 327786 frames
551
  Requested Block Size 2.0 MB
552
  Peak Block count 1
553
  Peak Allocated memory 1.0 KB
554
  Peak Large allocation bytes 0 B
555
  [ALLOC_TYPETREE_THREAD]
556
- Peak usage frame count: [1.0 KB-2.0 KB]: 327785 frames, [2.0 KB-4.0 KB]: 1 frames
557
  Requested Block Size 2.0 MB
558
  Peak Block count 1
559
  Peak Allocated memory 2.2 KB
 
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
+ - Completed reload, in 0.034 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
+ UnloadTime: 0.204709 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
  TOO LONG
 
290
  TOO LONG
291
  TOO LONG
292
  TOO LONG
293
+ TOO LONG
294
+ TOO LONG
295
+ TOO LONG
296
+ TOO LONG
297
+ TOO LONG
298
+ TOO LONG
299
+ TOO LONG
300
+ TOO LONG
301
+ TOO LONG
302
+ TOO LONG
303
+ TOO LONG
304
+ TOO LONG
305
+ TOO LONG
306
+ TOO LONG
307
+ TOO LONG
308
+ TOO LONG
309
+ TOO LONG
310
+ TOO LONG
311
+ TOO LONG
312
+ TOO LONG
313
+ TOO LONG
314
+ TOO LONG
315
+ TOO LONG
316
+ TOO LONG
317
+ TOO LONG
318
+ TOO LONG
319
+ TOO LONG
320
+ TOO LONG
321
+ TOO LONG
322
+ TOO LONG
323
+ TOO LONG
324
+ TOO LONG
325
+ TOO LONG
326
+ TOO LONG
327
+ TOO LONG
328
+ TOO LONG
329
+ TOO LONG
330
+ TOO LONG
331
+ TOO LONG
332
+ TOO LONG
333
+ TOO LONG
334
+ TOO LONG
335
+ TOO LONG
336
+ TOO LONG
337
+ TOO LONG
338
+ TOO LONG
339
+ TOO LONG
340
+ TOO LONG
341
+ TOO LONG
342
+ TOO LONG
343
+ TOO LONG
344
+ TOO LONG
345
+ TOO LONG
346
+ TOO LONG
347
+ TOO LONG
348
+ TOO LONG
349
+ TOO LONG
350
+ TOO LONG
351
+ TOO LONG
352
+ TOO LONG
353
+ TOO LONG
354
+ TOO LONG
355
+ TOO LONG
356
+ TOO LONG
357
+ TOO LONG
358
+ TOO LONG
359
+ TOO LONG
360
+ TOO LONG
361
+ TOO LONG
362
+ TOO LONG
363
+ TOO LONG
364
+ TOO LONG
365
+ TOO LONG
366
+ TOO LONG
367
+ TOO LONG
368
+ TOO LONG
369
+ TOO LONG
370
+ TOO LONG
371
+ TOO LONG
372
+ TOO LONG
373
+ TOO LONG
374
+ TOO LONG
375
+ TOO LONG
376
+ TOO LONG
377
+ TOO LONG
378
+ TOO LONG
379
+ TOO LONG
380
+ TOO LONG
381
+ TOO LONG
382
+ TOO LONG
383
+ TOO LONG
384
+ TOO LONG
385
+ TOO LONG
386
+ TOO LONG
387
+ TOO LONG
388
+ TOO LONG
389
+ TOO LONG
390
+ TOO LONG
391
+ TOO LONG
392
+ TOO LONG
393
+ TOO LONG
394
+ TOO LONG
395
+ TOO LONG
396
+ TOO LONG
397
+ TOO LONG
398
+ TOO LONG
399
+ TOO LONG
400
+ TOO LONG
401
+ TOO LONG
402
+ TOO LONG
403
+ TOO LONG
404
+ TOO LONG
405
+ TOO LONG
406
+ TOO LONG
407
+ TOO LONG
408
+ TOO LONG
409
+ TOO LONG
410
+ TOO LONG
411
+ TOO LONG
412
+ TOO LONG
413
+ TOO LONG
414
+ TOO LONG
415
+ TOO LONG
416
+ TOO LONG
417
+ TOO LONG
418
+ TOO LONG
419
+ TOO LONG
420
+ TOO LONG
421
+ TOO LONG
422
+ TOO LONG
423
+ TOO LONG
424
+ TOO LONG
425
+ TOO LONG
426
+ TOO LONG
427
+ TOO LONG
428
+ TOO LONG
429
+ TOO LONG
430
+ TOO LONG
431
+ TOO LONG
432
+ TOO LONG
433
+ TOO LONG
434
+ TOO LONG
435
+ TOO LONG
436
+ TOO LONG
437
+ TOO LONG
438
+ TOO LONG
439
+ TOO LONG
440
+ TOO LONG
441
+ TOO LONG
442
+ TOO LONG
443
+ TOO LONG
444
+ TOO LONG
445
+ TOO LONG
446
+ TOO LONG
447
+ TOO LONG
448
+ TOO LONG
449
+ TOO LONG
450
+ TOO LONG
451
+ TOO LONG
452
+ TOO LONG
453
+ TOO LONG
454
+ TOO LONG
455
+ TOO LONG
456
+ TOO LONG
457
+ TOO LONG
458
+ TOO LONG
459
+ TOO LONG
460
+ TOO LONG
461
+ TOO LONG
462
+ TOO LONG
463
+ TOO LONG
464
+ TOO LONG
465
+ TOO LONG
466
+ TOO LONG
467
+ TOO LONG
468
+ TOO LONG
469
+ TOO LONG
470
+ TOO LONG
471
+ TOO LONG
472
+ TOO LONG
473
+ TOO LONG
474
+ TOO LONG
475
+ TOO LONG
476
+ TOO LONG
477
+ TOO LONG
478
+ TOO LONG
479
+ TOO LONG
480
+ TOO LONG
481
+ TOO LONG
482
+ TOO LONG
483
+ TOO LONG
484
+ TOO LONG
485
+ TOO LONG
486
+ TOO LONG
487
+ TOO LONG
488
+ TOO LONG
489
+ TOO LONG
490
+ TOO LONG
491
+ TOO LONG
492
+ TOO LONG
493
+ TOO LONG
494
+ TOO LONG
495
+ TOO LONG
496
+ TOO LONG
497
+ TOO LONG
498
+ TOO LONG
499
+ TOO LONG
500
+ TOO LONG
501
+ TOO LONG
502
+ TOO LONG
503
+ TOO LONG
504
+ TOO LONG
505
+ TOO LONG
506
+ TOO LONG
507
+ TOO LONG
508
+ TOO LONG
509
+ TOO LONG
510
+ TOO LONG
511
+ TOO LONG
512
+ TOO LONG
513
+ TOO LONG
514
+ TOO LONG
515
+ TOO LONG
516
+ TOO LONG
517
+ TOO LONG
518
+ TOO LONG
519
+ TOO LONG
520
+ TOO LONG
521
+ TOO LONG
522
+ TOO LONG
523
+ TOO LONG
524
+ TOO LONG
525
+ TOO LONG
526
+ TOO LONG
527
+ TOO LONG
528
+ TOO LONG
529
+ TOO LONG
530
+ TOO LONG
531
+ TOO LONG
532
+ TOO LONG
533
+ TOO LONG
534
+ TOO LONG
535
+ TOO LONG
536
+ TOO LONG
537
+ TOO LONG
538
+ TOO LONG
539
+ Thread 0x1711cf000 may have been prematurely finalized
540
  Setting up 6 worker threads for Enlighten.
541
  Memory Statistics:
542
  [ALLOC_TEMP_TLS] TLS Allocator
543
  StackAllocators :
544
  [ALLOC_TEMP_MAIN]
545
+ Peak usage frame count: [8.0 KB-16.0 KB]: 94692 frames, [2.0 MB-4.0 MB]: 1 frames
546
  Initial Block Size 4.0 MB
547
  Current Block Size 4.0 MB
548
  Peak Allocated Bytes 2.1 MB
 
605
  [ALLOC_TEMP_Job.Worker 3]
606
  Initial Block Size 256.0 KB
607
  Current Block Size 256.0 KB
608
+ Peak Allocated Bytes 0.7 KB
609
  Overflow Count 0
610
  [ALLOC_TEMP_Background Job.Worker 12]
611
  Initial Block Size 32.0 KB
 
660
  [ALLOC_TEMP_Job.Worker 8]
661
  Initial Block Size 256.0 KB
662
  Current Block Size 256.0 KB
663
+ Peak Allocated Bytes 0 B
664
  Overflow Count 0
665
  [ALLOC_TEMP_OSX HID Input]
666
  Initial Block Size 64.0 KB
 
713
  Peak Allocated Bytes 0 B
714
  Overflow Count 0
715
  [ALLOC_DEFAULT] Dual Thread Allocator
716
+ Peak main deferred allocation count 6
717
  [ALLOC_BUCKET]
718
  Large Block size 4.0 MB
719
  Used Block count 1
720
  Peak Allocated bytes 1.0 MB
721
  [ALLOC_DEFAULT_MAIN]
722
+ Peak usage frame count: [4.0 MB-8.0 MB]: 94693 frames
723
  Requested Block Size 16.0 MB
724
  Peak Block count 1
725
+ Peak Allocated memory 5.0 MB
726
  Peak Large allocation bytes 0 B
727
  [ALLOC_DEFAULT_THREAD]
728
+ Peak usage frame count: [16.0 MB-32.0 MB]: 94693 frames
729
  Requested Block Size 16.0 MB
730
  Peak Block count 1
731
+ Peak Allocated memory 17.4 MB
732
  Peak Large allocation bytes 16.0 MB
733
  [ALLOC_TEMP_JOB_1_FRAME]
734
  Initial Block Size 2.0 MB
 
757
  Used Block count 1
758
  Peak Allocated bytes 1.0 MB
759
  [ALLOC_GFX_MAIN]
760
+ Peak usage frame count: [32.0 KB-64.0 KB]: 94692 frames, [64.0 KB-128.0 KB]: 1 frames
761
  Requested Block Size 16.0 MB
762
  Peak Block count 1
763
  Peak Allocated memory 65.6 KB
764
  Peak Large allocation bytes 0 B
765
  [ALLOC_GFX_THREAD]
766
+ Peak usage frame count: [128.0 KB-256.0 KB]: 94693 frames
767
  Requested Block Size 16.0 MB
768
  Peak Block count 1
769
  Peak Allocated memory 173.5 KB
 
775
  Used Block count 1
776
  Peak Allocated bytes 1.0 MB
777
  [ALLOC_CACHEOBJECTS_MAIN]
778
+ Peak usage frame count: [0.5 MB-1.0 MB]: 94693 frames
779
  Requested Block Size 4.0 MB
780
  Peak Block count 1
781
  Peak Allocated memory 0.6 MB
782
  Peak Large allocation bytes 0 B
783
  [ALLOC_CACHEOBJECTS_THREAD]
784
+ Peak usage frame count: [0.5 MB-1.0 MB]: 94692 frames, [2.0 MB-4.0 MB]: 1 frames
785
  Requested Block Size 4.0 MB
786
  Peak Block count 1
787
  Peak Allocated memory 3.4 MB
 
793
  Used Block count 1
794
  Peak Allocated bytes 1.0 MB
795
  [ALLOC_TYPETREE_MAIN]
796
+ Peak usage frame count: [0-1.0 KB]: 94693 frames
797
  Requested Block Size 2.0 MB
798
  Peak Block count 1
799
  Peak Allocated memory 1.0 KB
800
  Peak Large allocation bytes 0 B
801
  [ALLOC_TYPETREE_THREAD]
802
+ Peak usage frame count: [1.0 KB-2.0 KB]: 94692 frames, [2.0 KB-4.0 KB]: 1 frames
803
  Requested Block Size 2.0 MB
804
  Peak Block count 1
805
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 1.3300622701644897,
6
- "min": 1.266438364982605,
7
- "max": 3.29573655128479,
8
- "count": 1740
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 27069.427734375,
12
- "min": 21218.80078125,
13
- "max": 106789.578125,
14
- "count": 1740
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 89.76363636363637,
18
- "min": 40.675213675213676,
19
  "max": 999.0,
20
- "count": 1740
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19748.0,
24
- "min": 9376.0,
25
- "max": 31520.0,
26
- "count": 1740
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1673.6429207825179,
30
- "min": 1196.5457435177627,
31
- "max": 1726.4687385612406,
32
- "count": 1739
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 184100.72128607697,
36
- "min": 2394.535852594916,
37
- "max": 376556.50433398865,
38
- "count": 1739
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 17399884.0,
42
- "min": 9778.0,
43
- "max": 17399884.0,
44
- "count": 1740
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 17399884.0,
48
- "min": 9778.0,
49
- "max": 17399884.0,
50
- "count": 1740
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": -0.04988090693950653,
54
- "min": -0.13098840415477753,
55
- "max": 0.16840921342372894,
56
- "count": 1740
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": -5.536780834197998,
60
- "min": -19.894561767578125,
61
- "max": 21.182220458984375,
62
- "count": 1740
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": -0.049323659390211105,
66
- "min": -0.13105210661888123,
67
- "max": 0.17191989719867706,
68
- "count": 1740
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": -5.474925994873047,
72
- "min": -20.791091918945312,
73
- "max": 21.83549690246582,
74
- "count": 1740
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 1740
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 1740
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.19373873762182287,
90
- "min": -0.6153846153846154,
91
- "max": 0.42934736766313253,
92
- "count": 1740
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -21.50499987602234,
96
- "min": -55.30279994010925,
97
- "max": 52.12959986925125,
98
- "count": 1740
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.19373873762182287,
102
- "min": -0.6153846153846154,
103
- "max": 0.42934736766313253,
104
- "count": 1740
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -21.50499987602234,
108
- "min": -55.30279994010925,
109
- "max": 52.12959986925125,
110
- "count": 1740
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 1740
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 1740
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.018441027875026824,
126
- "min": 0.011074252808854605,
127
- "max": 0.029008984806326528,
128
- "count": 843
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.018441027875026824,
132
- "min": 0.011074252808854605,
133
- "max": 0.029008984806326528,
134
- "count": 843
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.08094811787207921,
138
- "min": 0.0011656492541078478,
139
- "max": 0.11928065071503322,
140
- "count": 843
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.08094811787207921,
144
- "min": 0.0011656492541078478,
145
- "max": 0.11928065071503322,
146
- "count": 843
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.08201082050800323,
150
- "min": 0.0011800630503178884,
151
- "max": 0.12257990539073944,
152
- "count": 843
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.08201082050800323,
156
- "min": 0.0011800630503178884,
157
- "max": 0.12257990539073944,
158
- "count": 843
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 0.0003260040147992041,
162
- "min": 0.0003260040147992041,
163
- "max": 0.0004997152400569519,
164
- "count": 843
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 0.0003260040147992041,
168
- "min": 0.0003260040147992041,
169
- "max": 0.0004997152400569519,
170
- "count": 843
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.16520079599999996,
174
- "min": 0.16520079599999996,
175
- "max": 0.19994304799999996,
176
- "count": 843
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.16520079599999996,
180
- "min": 0.16520079599999996,
181
- "max": 0.19994304799999996,
182
- "count": 843
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
- "value": 0.003263519720399999,
186
- "min": 0.003263519720399999,
187
- "max": 0.004997158095199998,
188
- "count": 843
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
- "value": 0.003263519720399999,
192
- "min": 0.003263519720399999,
193
- "max": 0.004997158095199998,
194
- "count": 843
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1703778636",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 15:02:25) [Clang 14.0.6 ]",
201
  "command_line_arguments": "/opt/homebrew/Caskroom/miniconda/base/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.app --run-id=SoccerTwos --no-graphics --force",
202
  "mlagents_version": "1.1.0.dev0",
@@ -204,103 +204,103 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.1.2",
206
  "numpy_version": "1.23.5",
207
- "end_time_seconds": "1703795928"
208
  },
209
- "total": 17291.35947341699,
210
  "count": 1,
211
- "self": 10.002615667006467,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.014216332987416536,
215
  "count": 1,
216
- "self": 0.014216332987416536
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 17281.342641416995,
220
  "count": 1,
221
- "self": 7.727816474769497,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 1.8024594139424153,
225
- "count": 70,
226
- "self": 1.8024594139424153
227
  },
228
  "TrainerController.advance": {
229
- "total": 17271.652083277266,
230
- "count": 1196889,
231
- "self": 7.361157477425877,
232
  "children": {
233
  "env_step": {
234
- "total": 7843.07346421259,
235
- "count": 1196889,
236
- "self": 6619.223402722797,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 1218.7477199516725,
240
- "count": 1196889,
241
- "self": 36.26535058821901,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 1182.4823693634535,
245
- "count": 2185268,
246
- "self": 1182.4823693634535
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 5.102341538120527,
252
- "count": 1196888,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 17268.48108889186,
257
- "count": 1196888,
258
  "is_parallel": true,
259
- "self": 11671.18532553385,
260
  "children": {
261
  "steps_from_proto": {
262
- "total": 0.044110004091635346,
263
- "count": 140,
264
  "is_parallel": true,
265
- "self": 0.0071852429246064276,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
- "total": 0.03692476116702892,
269
- "count": 560,
270
  "is_parallel": true,
271
- "self": 0.03692476116702892
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
- "total": 5597.2516533539165,
277
- "count": 1196888,
278
  "is_parallel": true,
279
- "self": 272.46567574935034,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
- "total": 129.84849359397776,
283
- "count": 1196888,
284
  "is_parallel": true,
285
- "self": 129.84849359397776
286
  },
287
  "communicator.exchange": {
288
- "total": 4506.445674063638,
289
- "count": 1196888,
290
  "is_parallel": true,
291
- "self": 4506.445674063638
292
  },
293
  "steps_from_proto": {
294
- "total": 688.4918099469505,
295
- "count": 2393776,
296
  "is_parallel": true,
297
- "self": 106.13120424517547,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
- "total": 582.3606057017751,
301
- "count": 9575104,
302
  "is_parallel": true,
303
- "self": 582.3606057017751
304
  }
305
  }
306
  }
@@ -313,31 +313,31 @@
313
  }
314
  },
315
  "trainer_advance": {
316
- "total": 9421.21746158725,
317
- "count": 1196888,
318
- "self": 69.65316009536036,
319
  "children": {
320
  "process_trajectory": {
321
- "total": 1950.7394902148517,
322
- "count": 1196888,
323
- "self": 1945.4922155466338,
324
  "children": {
325
  "RLTrainer._checkpoint": {
326
- "total": 5.2472746682178695,
327
- "count": 34,
328
- "self": 5.2472746682178695
329
  }
330
  }
331
  },
332
  "_update_policy": {
333
- "total": 7400.824811277038,
334
- "count": 843,
335
- "self": 830.3490734959778,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
- "total": 6570.47573778106,
339
- "count": 25299,
340
- "self": 6570.47573778106
341
  }
342
  }
343
  }
@@ -346,19 +346,19 @@
346
  }
347
  },
348
  "trainer_threads": {
349
- "total": 3.33995558321476e-07,
350
  "count": 1,
351
- "self": 3.33995558321476e-07
352
  },
353
  "TrainerController._save_models": {
354
- "total": 0.1602819170220755,
355
  "count": 1,
356
- "self": 0.0015421260322909802,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
- "total": 0.15873979098978452,
360
  "count": 1,
361
- "self": 0.15873979098978452
362
  }
363
  }
364
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.755637288093567,
6
+ "min": 1.7151814699172974,
7
+ "max": 3.295724630355835,
8
+ "count": 499
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 36910.51953125,
12
+ "min": 13612.6572265625,
13
+ "max": 172905.75,
14
+ "count": 499
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 63.6125,
18
+ "min": 39.645161290322584,
19
  "max": 999.0,
20
+ "count": 499
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 20356.0,
24
+ "min": 10692.0,
25
+ "max": 31500.0,
26
+ "count": 499
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1540.6404213531655,
30
+ "min": 1197.4957713356807,
31
+ "max": 1576.4143309371482,
32
+ "count": 478
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 246502.4674165065,
36
+ "min": 2399.421175774324,
37
+ "max": 363079.2013600959,
38
+ "count": 478
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 4999972.0,
42
+ "min": 9254.0,
43
+ "max": 4999972.0,
44
+ "count": 500
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 4999972.0,
48
+ "min": 9254.0,
49
+ "max": 4999972.0,
50
+ "count": 500
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.034482039511203766,
54
+ "min": -0.10746785998344421,
55
+ "max": 0.16136549413204193,
56
+ "count": 500
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -5.517126083374023,
60
+ "min": -22.675718307495117,
61
+ "max": 27.432022094726562,
62
+ "count": 500
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.034504301846027374,
66
+ "min": -0.11580751091241837,
67
+ "max": 0.1590351015329361,
68
+ "count": 500
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -5.520688533782959,
72
+ "min": -24.43538475036621,
73
+ "max": 26.952106475830078,
74
+ "count": 500
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 500
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 500
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": -0.08047500103712082,
90
+ "min": -0.5921090895479376,
91
+ "max": 0.4576799988746643,
92
+ "count": 500
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": -12.876000165939331,
96
+ "min": -66.35360014438629,
97
+ "max": 60.00919944047928,
98
+ "count": 500
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": -0.08047500103712082,
102
+ "min": -0.5921090895479376,
103
+ "max": 0.4576799988746643,
104
+ "count": 500
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": -12.876000165939331,
108
+ "min": -66.35360014438629,
109
+ "max": 60.00919944047928,
110
+ "count": 500
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 500
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 500
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.015034021192695946,
126
+ "min": 0.010941779592152064,
127
+ "max": 0.024873137117053072,
128
+ "count": 239
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.015034021192695946,
132
+ "min": 0.010941779592152064,
133
+ "max": 0.024873137117053072,
134
+ "count": 239
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.11739198019107183,
138
+ "min": 3.1021232795562052e-06,
139
+ "max": 0.1251884085436662,
140
+ "count": 239
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.11739198019107183,
144
+ "min": 3.1021232795562052e-06,
145
+ "max": 0.1251884085436662,
146
+ "count": 239
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.11775108724832535,
150
+ "min": 3.304618659664508e-06,
151
+ "max": 0.1258082126577695,
152
+ "count": 239
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.11775108724832535,
156
+ "min": 3.304618659664508e-06,
157
+ "max": 0.1258082126577695,
158
+ "count": 239
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
+ "value": 1.0132997973599917e-06,
162
+ "min": 1.0132997973599917e-06,
163
+ "max": 0.0004968980006203998,
164
+ "count": 239
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
+ "value": 1.0132997973599917e-06,
168
+ "min": 1.0132997973599917e-06,
169
+ "max": 0.0004968980006203998,
170
+ "count": 239
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
+ "value": 0.10020264000000001,
174
+ "min": 0.10020264000000001,
175
+ "max": 0.19937960000000005,
176
+ "count": 239
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
+ "value": 0.10020264000000001,
180
+ "min": 0.10020264000000001,
181
+ "max": 0.19937960000000005,
182
+ "count": 239
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
+ "value": 2.0111735999999927e-05,
186
+ "min": 2.0111735999999927e-05,
187
+ "max": 0.004969042040000001,
188
+ "count": 239
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
+ "value": 2.0111735999999927e-05,
192
+ "min": 2.0111735999999927e-05,
193
+ "max": 0.004969042040000001,
194
+ "count": 239
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1703848764",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 15:02:25) [Clang 14.0.6 ]",
201
  "command_line_arguments": "/opt/homebrew/Caskroom/miniconda/base/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.app --run-id=SoccerTwos --no-graphics --force",
202
  "mlagents_version": "1.1.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.1.2",
206
  "numpy_version": "1.23.5",
207
+ "end_time_seconds": "1703853889"
208
  },
209
+ "total": 5124.430119083001,
210
  "count": 1,
211
+ "self": 0.19001916600973345,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.012270416977116838,
215
  "count": 1,
216
+ "self": 0.012270416977116838
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 5124.227829500014,
220
  "count": 1,
221
+ "self": 2.531355981802335,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 1.5887895020714495,
225
+ "count": 20,
226
+ "self": 1.5887895020714495
227
  },
228
  "TrainerController.advance": {
229
+ "total": 5119.955040642148,
230
+ "count": 341985,
231
+ "self": 2.185286336200079,
232
  "children": {
233
  "env_step": {
234
+ "total": 2303.891035468987,
235
+ "count": 341985,
236
+ "self": 1941.7491068352829,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 360.6655651805049,
240
+ "count": 341985,
241
+ "self": 11.17105897743022,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 349.4945062030747,
245
+ "count": 631296,
246
+ "self": 349.4945062030747
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 1.4763634531991556,
252
+ "count": 341985,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 5119.23122701954,
257
+ "count": 341985,
258
  "is_parallel": true,
259
+ "self": 3492.6540978672565,
260
  "children": {
261
  "steps_from_proto": {
262
+ "total": 0.013060167053481564,
263
+ "count": 40,
264
  "is_parallel": true,
265
+ "self": 0.0021915972174610943,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
+ "total": 0.01086856983602047,
269
+ "count": 160,
270
  "is_parallel": true,
271
+ "self": 0.01086856983602047
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
+ "total": 1626.5640689852298,
277
+ "count": 341985,
278
  "is_parallel": true,
279
+ "self": 78.99318619386759,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
+ "total": 37.23996753204847,
283
+ "count": 341985,
284
  "is_parallel": true,
285
+ "self": 37.23996753204847
286
  },
287
  "communicator.exchange": {
288
+ "total": 1310.1512493426271,
289
+ "count": 341985,
290
  "is_parallel": true,
291
+ "self": 1310.1512493426271
292
  },
293
  "steps_from_proto": {
294
+ "total": 200.17966591668664,
295
+ "count": 683970,
296
  "is_parallel": true,
297
+ "self": 30.950994182756403,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
+ "total": 169.22867173393024,
301
+ "count": 2735880,
302
  "is_parallel": true,
303
+ "self": 169.22867173393024
304
  }
305
  }
306
  }
 
313
  }
314
  },
315
  "trainer_advance": {
316
+ "total": 2813.8787188369606,
317
+ "count": 341985,
318
+ "self": 21.16630858287681,
319
  "children": {
320
  "process_trajectory": {
321
+ "total": 556.1312195862702,
322
+ "count": 341985,
323
+ "self": 554.5936779602489,
324
  "children": {
325
  "RLTrainer._checkpoint": {
326
+ "total": 1.537541626021266,
327
+ "count": 10,
328
+ "self": 1.537541626021266
329
  }
330
  }
331
  },
332
  "_update_policy": {
333
+ "total": 2236.5811906678136,
334
+ "count": 239,
335
+ "self": 242.41541127837263,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
+ "total": 1994.165779389441,
339
+ "count": 7185,
340
+ "self": 1994.165779389441
341
  }
342
  }
343
  }
 
346
  }
347
  },
348
  "trainer_threads": {
349
+ "total": 3.3300602808594704e-07,
350
  "count": 1,
351
+ "self": 3.3300602808594704e-07
352
  },
353
  "TrainerController._save_models": {
354
+ "total": 0.15264304098673165,
355
  "count": 1,
356
+ "self": 0.000656957970932126,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
+ "total": 0.15198608301579952,
360
  "count": 1,
361
+ "self": 0.15198608301579952
362
  }
363
  }
364
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 15499904,
6
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-15499904.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1703794033.6399949,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos/SoccerTwos/SoccerTwos-15499904.pt"
11
  ]
12
  },
13
  {
14
- "steps": 15999958,
15
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-15999958.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1703794534.1326778,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos/SoccerTwos/SoccerTwos-15999958.pt"
20
  ]
21
  },
22
  {
23
- "steps": 16499979,
24
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-16499979.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1703795023.9592068,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos/SoccerTwos/SoccerTwos-16499979.pt"
29
  ]
30
  },
31
  {
32
- "steps": 16999852,
33
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-16999852.onnx",
34
  "reward": 0.0,
35
- "creation_time": 1703795515.021195,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos/SoccerTwos/SoccerTwos-16999852.pt"
38
  ]
39
  },
40
  {
41
- "steps": 17409136,
42
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-17409136.onnx",
43
  "reward": 0.0,
44
- "creation_time": 1703795918.066219,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos/SoccerTwos/SoccerTwos-17409136.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1673.7859725087915,
51
  "final_checkpoint": {
52
- "steps": 17409136,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
  "reward": 0.0,
55
- "creation_time": 1703795918.066219,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos/SoccerTwos/SoccerTwos-17409136.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 3499990,
6
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-3499990.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1703852337.048543,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-3499990.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 3999988,
15
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-3999988.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1703852850.532505,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-3999988.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 4499985,
24
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-4499985.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1703853379.401021,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-4499985.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 4999972,
33
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-4999972.onnx",
34
  "reward": 0.0,
35
+ "creation_time": 1703853888.732385,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-4999972.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 5000376,
42
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-5000376.onnx",
43
  "reward": 0.0,
44
+ "creation_time": 1703853888.9599922,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-5000376.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1543.402385883174,
51
  "final_checkpoint": {
52
+ "steps": 5000376,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1703853888.9599922,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-5000376.pt"
58
  ]
59
  }
60
  },