Statos6 committed on
Commit
55a8929
1 Parent(s): f5c5d35
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b6d608c4248e0b310070b2af2b4ea2275b174aeed4ae07c4b7ff7524ee580d5
3
  size 895526
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d80a03b6c3ffa7be5d4037e3815a3696b1e1198da3bea1d6bcfc61028f6587
3
  size 895526
SoccerTwos/SoccerTwos-13499994.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ad54bea8430cb2786318de3ce8dde082b5f65d22499ece282e7c51cad5dfdad
3
+ size 895526
SoccerTwos/SoccerTwos-13499994.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:984e380fa477b8269f25a1e5f34519a210f75d9ce207300e85a586c3bedefbc8
3
+ size 10325290
SoccerTwos/SoccerTwos-13999986.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cf6c9eb6e522f7d25eb7e5e92d7c331bea382d26bbf1980680217d2161c6257
3
+ size 895526
SoccerTwos/SoccerTwos-13999986.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28b465cf20ff188aec6de3d33e14b17ed46e2af4cee6410df185c96dfe51df34
3
+ size 10325290
SoccerTwos/SoccerTwos-14499998.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48ad434cf6c13fe55dfe514fb5c912e928dafcd12fb78ebcce137c40e0610f9
3
+ size 895526
SoccerTwos/SoccerTwos-14499998.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7a40b1cf22bd1c8975c79ebf98fb6728392a5c082ebb0c4325bcab83ecf9ed7
3
+ size 10325290
SoccerTwos/SoccerTwos-14999982.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:387813bafb9dfb3244a8e0b084dd2b2b21f2fe6895e52b6f93247fa389f90105
3
+ size 895526
SoccerTwos/SoccerTwos-14999982.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc979094443202bf62830d19a8f572eb192a0dcb0b65502c8f1a3c6b2c29cf8
3
+ size 10325290
SoccerTwos/SoccerTwos-15000014.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d80a03b6c3ffa7be5d4037e3815a3696b1e1198da3bea1d6bcfc61028f6587
3
+ size 895526
SoccerTwos/SoccerTwos-15000014.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aae125a758c60aebaea95e62b8c64d403e394391f33d5fe49424f886618188f6
3
+ size 10325290
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37854fa1cf62607fbcf6e1fa3522fdc3890a2084987edc894f3955253d66549d
3
  size 10323922
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55c392f23767ea885f166609ad60d396536d6c5888529ce286af22bccd997bd9
3
  size 10323922
SoccerTwos/events.out.tfevents.1710358561.stephan-ms7c02.36177.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:792f7edae81403905fc5199882d2424fca8d5b5a21404635a88621361bf9c398
3
+ size 1319
SoccerTwos/events.out.tfevents.1710358577.stephan-ms7c02.36326.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d76291da51fd3588d0e00aa3006735bc784ceabafc32923690126f5c039b7957
3
+ size 5082615
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 10000000, "time_horizon": 32, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 60000, "team_change": 589998, "swap_steps": 70000, "window": 25, "play_against_latest_model_ratio": 0.75, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./ml-agents/training-envs-executables/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 1280, "height": 720, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos-read-deal", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 15000000, "time_horizon": 32, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 60000, "team_change": 589998, "swap_steps": 70000, "window": 25, "play_against_latest_model_ratio": 0.75, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./ml-agents/training-envs-executables/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 1280, "height": 720, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos-read-deal", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 10000000
41
  time_horizon: 32
42
  summary_freq: 10000
43
  threaded: false
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 15000000
41
  time_horizon: 32
42
  summary_freq: 10000
43
  threaded: false
run_logs/Player-0.log CHANGED
@@ -19,14 +19,14 @@ ns GL_ARB_stencil_texturing GL_ARB_sync GL_ARB_tessellation_shader GL_ARB_textur
19
  _buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
20
  c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
21
  atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
22
- OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle 22053744
23
  Begin MonoManager ReloadAssembly
24
- - Completed reload, in 0.092 seconds
25
  Default vsync count 1
26
  requesting resize 1280 x 720
27
  resizing window to 1280 x 720
28
  Desktop is 1920 x 1080 @ 60 Hz
29
- UnloadTime: 0.807040 ms
30
  Registered Communicator in Agent.
31
  Setting up 6 worker threads for Enlighten.
32
  requesting resize 1280 x 720
@@ -36,7 +36,7 @@ Memory Statistics:
36
  [ALLOC_TEMP_TLS] TLS Allocator
37
  StackAllocators :
38
  [ALLOC_TEMP_MAIN]
39
- Peak usage frame count: [8.0 KB-16.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
40
  Initial Block Size 4.0 MB
41
  Current Block Size 4.0 MB
42
  Peak Allocated Bytes 2.1 MB
@@ -213,16 +213,16 @@ Memory Statistics:
213
  Used Block count 1
214
  Peak Allocated bytes 1.9 MB
215
  [ALLOC_DEFAULT_MAIN]
216
- Peak usage frame count: [8.0 MB-16.0 MB]: 62728 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
- Peak Allocated memory 13.0 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_DEFAULT_THREAD]
222
- Peak usage frame count: [16.0 MB-32.0 MB]: 62728 frames
223
  Requested Block Size 16.0 MB
224
  Peak Block count 1
225
- Peak Allocated memory 28.7 MB
226
  Peak Large allocation bytes 16.0 MB
227
  [ALLOC_TEMP_JOB_1_FRAME]
228
  Initial Block Size 2.0 MB
@@ -251,13 +251,13 @@ Memory Statistics:
251
  Used Block count 1
252
  Peak Allocated bytes 1.9 MB
253
  [ALLOC_GFX_MAIN]
254
- Peak usage frame count: [32.0 KB-64.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 2.7 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_GFX_THREAD]
260
- Peak usage frame count: [128.0 KB-256.0 KB]: 62728 frames
261
  Requested Block Size 16.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 174.7 KB
@@ -269,13 +269,13 @@ Memory Statistics:
269
  Used Block count 1
270
  Peak Allocated bytes 1.9 MB
271
  [ALLOC_CACHEOBJECTS_MAIN]
272
- Peak usage frame count: [0.5 MB-1.0 MB]: 62727 frames, [1.0 MB-2.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.2 MB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_CACHEOBJECTS_THREAD]
278
- Peak usage frame count: [4.0 MB-8.0 MB]: 62728 frames
279
  Requested Block Size 4.0 MB
280
  Peak Block count 2
281
  Peak Allocated memory 7.8 MB
@@ -287,13 +287,13 @@ Memory Statistics:
287
  Used Block count 1
288
  Peak Allocated bytes 1.9 MB
289
  [ALLOC_TYPETREE_MAIN]
290
- Peak usage frame count: [0-1.0 KB]: 62728 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 1.0 KB
294
  Peak Large allocation bytes 0 B
295
  [ALLOC_TYPETREE_THREAD]
296
- Peak usage frame count: [1.0 KB-2.0 KB]: 62727 frames, [2.0 KB-4.0 KB]: 1 frames
297
  Requested Block Size 2.0 MB
298
  Peak Block count 1
299
  Peak Allocated memory 2.2 KB
 
19
  _buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
20
  c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
21
  atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
22
+ OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle 28321776
23
  Begin MonoManager ReloadAssembly
24
+ - Completed reload, in 0.091 seconds
25
  Default vsync count 1
26
  requesting resize 1280 x 720
27
  resizing window to 1280 x 720
28
  Desktop is 1920 x 1080 @ 60 Hz
29
+ UnloadTime: 0.942291 ms
30
  Registered Communicator in Agent.
31
  Setting up 6 worker threads for Enlighten.
32
  requesting resize 1280 x 720
 
36
  [ALLOC_TEMP_TLS] TLS Allocator
37
  StackAllocators :
38
  [ALLOC_TEMP_MAIN]
39
+ Peak usage frame count: [8.0 KB-16.0 KB]: 93732 frames, [2.0 MB-4.0 MB]: 1 frames
40
  Initial Block Size 4.0 MB
41
  Current Block Size 4.0 MB
42
  Peak Allocated Bytes 2.1 MB
 
213
  Used Block count 1
214
  Peak Allocated bytes 1.9 MB
215
  [ALLOC_DEFAULT_MAIN]
216
+ Peak usage frame count: [8.0 MB-16.0 MB]: 93733 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
+ Peak Allocated memory 12.9 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_DEFAULT_THREAD]
222
+ Peak usage frame count: [16.0 MB-32.0 MB]: 93733 frames
223
  Requested Block Size 16.0 MB
224
  Peak Block count 1
225
+ Peak Allocated memory 28.8 MB
226
  Peak Large allocation bytes 16.0 MB
227
  [ALLOC_TEMP_JOB_1_FRAME]
228
  Initial Block Size 2.0 MB
 
251
  Used Block count 1
252
  Peak Allocated bytes 1.9 MB
253
  [ALLOC_GFX_MAIN]
254
+ Peak usage frame count: [32.0 KB-64.0 KB]: 93732 frames, [2.0 MB-4.0 MB]: 1 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 2.7 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_GFX_THREAD]
260
+ Peak usage frame count: [128.0 KB-256.0 KB]: 93733 frames
261
  Requested Block Size 16.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 174.7 KB
 
269
  Used Block count 1
270
  Peak Allocated bytes 1.9 MB
271
  [ALLOC_CACHEOBJECTS_MAIN]
272
+ Peak usage frame count: [0.5 MB-1.0 MB]: 93732 frames, [1.0 MB-2.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.2 MB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_CACHEOBJECTS_THREAD]
278
+ Peak usage frame count: [4.0 MB-8.0 MB]: 93733 frames
279
  Requested Block Size 4.0 MB
280
  Peak Block count 2
281
  Peak Allocated memory 7.8 MB
 
287
  Used Block count 1
288
  Peak Allocated bytes 1.9 MB
289
  [ALLOC_TYPETREE_MAIN]
290
+ Peak usage frame count: [0-1.0 KB]: 93733 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 1.0 KB
294
  Peak Large allocation bytes 0 B
295
  [ALLOC_TYPETREE_THREAD]
296
+ Peak usage frame count: [1.0 KB-2.0 KB]: 93732 frames, [2.0 KB-4.0 KB]: 1 frames
297
  Requested Block Size 2.0 MB
298
  Peak Block count 1
299
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 1.4048619270324707,
6
- "min": 1.3750499486923218,
7
- "max": 1.7051565647125244,
8
- "count": 335
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 28277.060546875,
12
- "min": 14701.9814453125,
13
- "max": 34322.671875,
14
- "count": 335
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 45.06422018348624,
18
- "min": 35.125,
19
- "max": 53.40425531914894,
20
- "count": 335
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19648.0,
24
- "min": 8072.0,
25
- "max": 20960.0,
26
- "count": 335
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1607.9046472284606,
30
- "min": 1555.6832652825399,
31
- "max": 1613.038356436412,
32
- "count": 335
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 350523.2130958044,
36
- "min": 163654.2453609866,
37
- "max": 434134.2547516843,
38
- "count": 335
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 9999982.0,
42
- "min": 6659988.0,
43
- "max": 9999982.0,
44
- "count": 335
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 9999982.0,
48
- "min": 6659988.0,
49
- "max": 9999982.0,
50
- "count": 335
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.03223046660423279,
54
- "min": -0.11106479167938232,
55
- "max": 0.10332842171192169,
56
- "count": 335
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 13.246722221374512,
60
- "min": -46.31401824951172,
61
- "max": 44.017906188964844,
62
- "count": 335
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.031953852623701096,
66
- "min": -0.11250180751085281,
67
- "max": 0.10477326810359955,
68
- "count": 335
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 13.133033752441406,
72
- "min": -46.91325378417969,
73
- "max": 44.6334114074707,
74
- "count": 335
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 335
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 335
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": 0.09531192604554903,
90
- "min": -0.381275439994377,
91
- "max": 0.26663347656634745,
92
- "count": 335
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": 20.777999877929688,
96
- "min": -86.93080031871796,
97
- "max": 62.125600039958954,
98
- "count": 335
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": 0.09531192604554903,
102
- "min": -0.381275439994377,
103
- "max": 0.26663347656634745,
104
- "count": 335
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": 20.777999877929688,
108
- "min": -86.93080031871796,
109
- "max": 62.125600039958954,
110
- "count": 335
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 335
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 335
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.01046212162455049,
126
- "min": 0.009879295097471185,
127
- "max": 0.014559235423075734,
128
- "count": 51
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.01046212162455049,
132
- "min": 0.009879295097471185,
133
- "max": 0.014559235423075734,
134
- "count": 51
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.05891079842112958,
138
- "min": 0.04971672408282757,
139
- "max": 0.05918900854885578,
140
- "count": 51
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.05891079842112958,
144
- "min": 0.04971672408282757,
145
- "max": 0.05918900854885578,
146
- "count": 51
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.05924153439700604,
150
- "min": 0.051102403877303006,
151
- "max": 0.05954511137679219,
152
- "count": 51
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.05924153439700604,
156
- "min": 0.051102403877303006,
157
- "max": 0.05954511137679219,
158
- "count": 51
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 6.4449295954992225e-09,
162
- "min": 6.4449295954992225e-09,
163
- "max": 0.00014248644558948728,
164
- "count": 51
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 6.4449295954992225e-09,
168
- "min": 6.4449295954992225e-09,
169
- "max": 0.00014248644558948728,
170
- "count": 51
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.10000085146159124,
174
- "min": 0.10000085146159124,
175
- "max": 0.11912103967704953,
176
- "count": 51
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.10000085146159124,
180
- "min": 0.10000085146159124,
181
- "max": 0.11912103967704953,
182
- "count": 51
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
- "value": 1.0002659404254946e-05,
186
- "min": 1.0002659404254946e-05,
187
- "max": 6.972151274949521e-05,
188
- "count": 51
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
- "value": 1.0002659404254946e-05,
192
- "min": 1.0002659404254946e-05,
193
- "max": 6.972151274949521e-05,
194
- "count": 51
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1710343829",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
  "command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
202
  "mlagents_version": "1.1.0.dev0",
@@ -204,59 +204,59 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.2.1+cu121",
206
  "numpy_version": "1.23.5",
207
- "end_time_seconds": "1710353568"
208
  },
209
- "total": 9739.254863360999,
210
  "count": 1,
211
- "self": 0.270132729987381,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.018506341002648696,
215
  "count": 1,
216
- "self": 0.018506341002648696
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 9738.966224290009,
220
  "count": 1,
221
- "self": 4.652608350283117,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 4.244304390012985,
225
- "count": 7,
226
- "self": 4.244304390012985
227
  },
228
  "TrainerController.advance": {
229
- "total": 9729.947026144713,
230
- "count": 239073,
231
- "self": 4.148107524248189,
232
  "children": {
233
  "env_step": {
234
- "total": 4354.3673745146225,
235
- "count": 239073,
236
- "self": 3721.0493522615725,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 630.4299217515072,
240
- "count": 239073,
241
- "self": 19.02124206413282,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 611.4086796873744,
245
- "count": 418182,
246
- "self": 611.4086796873744
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 2.8881005015427945,
252
- "count": 239073,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 9731.739510110943,
257
- "count": 239073,
258
  "is_parallel": true,
259
- "self": 6533.360267171403,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +265,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.06389564499841072,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.000593470991589129,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.06330217400682159,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.06330217400682159
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.02612613000383135,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.000600070008658804,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.00040655999328009784,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.00040655999328009784
292
  },
293
  "communicator.exchange": {
294
- "total": 0.02343449799809605,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.02343449799809605
298
  },
299
  "steps_from_proto": {
300
- "total": 0.0016850020037963986,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.0003057300054933876,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.001379271998303011,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.001379271998303011
310
  }
311
  }
312
  }
@@ -315,48 +315,48 @@
315
  }
316
  },
317
  "steps_from_proto": {
318
- "total": 0.012151043978519738,
319
- "count": 12,
320
  "is_parallel": true,
321
- "self": 0.002059131977148354,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
- "total": 0.010091912001371384,
325
- "count": 48,
326
  "is_parallel": true,
327
- "self": 0.010091912001371384
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
- "total": 3198.3670918955613,
333
- "count": 239072,
334
  "is_parallel": true,
335
- "self": 175.16570653802773,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
- "total": 110.43290661888022,
339
- "count": 239072,
340
  "is_parallel": true,
341
- "self": 110.43290661888022
342
  },
343
  "communicator.exchange": {
344
- "total": 2470.8126502879313,
345
- "count": 239072,
346
  "is_parallel": true,
347
- "self": 2470.8126502879313
348
  },
349
  "steps_from_proto": {
350
- "total": 441.95582845072204,
351
- "count": 478144,
352
  "is_parallel": true,
353
- "self": 78.3687699053844,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
- "total": 363.58705854533764,
357
- "count": 1912576,
358
  "is_parallel": true,
359
- "self": 363.58705854533764
360
  }
361
  }
362
  }
@@ -369,31 +369,31 @@
369
  }
370
  },
371
  "trainer_advance": {
372
- "total": 5371.4315441058425,
373
- "count": 239073,
374
- "self": 26.83088273082103,
375
  "children": {
376
  "process_trajectory": {
377
- "total": 1094.2377518599678,
378
- "count": 239073,
379
- "self": 1093.3974272879568,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
- "total": 0.8403245720110135,
383
- "count": 7,
384
- "self": 0.8403245720110135
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
- "total": 4250.362909515054,
390
- "count": 51,
391
- "self": 652.032682771809,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
- "total": 3598.3302267432446,
395
- "count": 4080,
396
- "self": 3598.3302267432446
397
  }
398
  }
399
  }
@@ -402,19 +402,19 @@
402
  }
403
  },
404
  "trainer_threads": {
405
- "total": 9.200011845678091e-07,
406
  "count": 1,
407
- "self": 9.200011845678091e-07
408
  },
409
  "TrainerController._save_models": {
410
- "total": 0.12228448499809019,
411
  "count": 1,
412
- "self": 0.0026952329935738817,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
- "total": 0.11958925200451631,
416
  "count": 1,
417
- "self": 0.11958925200451631
418
  }
419
  }
420
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.11602783203125,
6
+ "min": 1.1030526161193848,
7
+ "max": 1.4285537004470825,
8
+ "count": 500
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 22320.556640625,
12
+ "min": 21029.970703125,
13
+ "max": 28662.501953125,
14
+ "count": 500
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 45.905660377358494,
18
+ "min": 35.28,
19
+ "max": 55.38202247191011,
20
+ "count": 500
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19464.0,
24
+ "min": 14112.0,
25
+ "max": 21312.0,
26
+ "count": 500
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1672.5986965358836,
30
+ "min": 1594.9761687604023,
31
+ "max": 1684.8696129621046,
32
+ "count": 500
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 354590.92366560735,
36
+ "min": 291606.7260394614,
37
+ "max": 450906.7595913422,
38
+ "count": 500
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 14999982.0,
42
+ "min": 10009972.0,
43
+ "max": 14999982.0,
44
+ "count": 500
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 14999982.0,
48
+ "min": 10009972.0,
49
+ "max": 14999982.0,
50
+ "count": 500
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.033846165984869,
54
+ "min": -0.10714015364646912,
55
+ "max": 0.09757562726736069,
56
+ "count": 500
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -13.876928329467773,
60
+ "min": -45.2131462097168,
61
+ "max": 41.95751953125,
62
+ "count": 500
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.03533671796321869,
66
+ "min": -0.11142526566982269,
67
+ "max": 0.10013997554779053,
68
+ "count": 500
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -14.488054275512695,
72
+ "min": -47.021461486816406,
73
+ "max": 43.06018829345703,
74
+ "count": 500
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 500
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 500
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": -0.07970754661650029,
90
+ "min": -0.26102524301380786,
91
+ "max": 0.3510517215934293,
92
+ "count": 500
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": -16.89799988269806,
96
+ "min": -55.66319966316223,
97
+ "max": 81.4439994096756,
98
+ "count": 500
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": -0.07970754661650029,
102
+ "min": -0.26102524301380786,
103
+ "max": 0.3510517215934293,
104
+ "count": 500
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": -16.89799988269806,
108
+ "min": -55.66319966316223,
109
+ "max": 81.4439994096756,
110
+ "count": 500
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 500
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 500
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.012091718217061499,
126
+ "min": 0.009822013491066173,
127
+ "max": 0.015032402960059699,
128
+ "count": 76
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.012091718217061499,
132
+ "min": 0.009822013491066173,
133
+ "max": 0.015032402960059699,
134
+ "count": 76
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.05806648256257176,
138
+ "min": 0.05226881531998515,
139
+ "max": 0.059615218080580235,
140
+ "count": 76
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.05806648256257176,
144
+ "min": 0.05226881531998515,
145
+ "max": 0.059615218080580235,
146
+ "count": 76
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.05836009904742241,
150
+ "min": 0.0542876117862761,
151
+ "max": 0.06110596880316734,
152
+ "count": 76
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.05836009904742241,
156
+ "min": 0.0542876117862761,
157
+ "max": 0.06110596880316734,
158
+ "count": 76
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
+ "value": 4.0553810392494676e-07,
162
+ "min": 4.0553810392494676e-07,
163
+ "max": 0.0001428860023203168,
164
+ "count": 76
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
+ "value": 4.0553810392494676e-07,
168
+ "min": 4.0553810392494676e-07,
169
+ "max": 0.0001428860023203168,
170
+ "count": 76
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
+ "value": 0.10005440800688417,
174
+ "min": 0.10005440800688417,
175
+ "max": 0.11917465842958205,
176
+ "count": 76
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
+ "value": 0.10005440800688417,
180
+ "min": 0.10005440800688417,
181
+ "max": 0.11917465842958205,
182
+ "count": 76
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
+ "value": 1.0169934717551432e-05,
186
+ "min": 1.0169934717551432e-05,
187
+ "max": 6.988898235716646e-05,
188
+ "count": 76
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
+ "value": 1.0169934717551432e-05,
192
+ "min": 1.0169934717551432e-05,
193
+ "max": 6.988898235716646e-05,
194
+ "count": 76
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1710358573",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
  "command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
202
  "mlagents_version": "1.1.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.2.1+cu121",
206
  "numpy_version": "1.23.5",
207
+ "end_time_seconds": "1710372965"
208
  },
209
+ "total": 14392.268066103992,
210
  "count": 1,
211
+ "self": 0.3203680879960302,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.017996288996073417,
215
  "count": 1,
216
+ "self": 0.017996288996073417
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 14391.929701727,
220
  "count": 1,
221
+ "self": 7.222826109427842,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 4.3356985290010925,
225
+ "count": 10,
226
+ "self": 4.3356985290010925
227
  },
228
  "TrainerController.advance": {
229
+ "total": 14380.252779454575,
230
+ "count": 357131,
231
+ "self": 6.432589866788476,
232
  "children": {
233
  "env_step": {
234
+ "total": 6466.631959918537,
235
+ "count": 357131,
236
+ "self": 5498.500712261317,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 963.7606686544896,
240
+ "count": 357131,
241
+ "self": 29.2971219017345,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 934.4635467527551,
245
+ "count": 624880,
246
+ "self": 934.4635467527551
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 4.370579002730665,
252
+ "count": 357131,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 14380.838316511697,
257
+ "count": 357131,
258
  "is_parallel": true,
259
+ "self": 9673.599672775075,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
 
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
+ "total": 0.06619343400234357,
269
  "count": 2,
270
  "is_parallel": true,
271
+ "self": 0.0004880309716099873,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
+ "total": 0.06570540303073358,
275
  "count": 8,
276
  "is_parallel": true,
277
+ "self": 0.06570540303073358
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
+ "total": 0.027265490003628656,
283
  "count": 1,
284
  "is_parallel": true,
285
+ "self": 0.0006784550059819594,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
+ "total": 0.0004930220020469278,
289
  "count": 1,
290
  "is_parallel": true,
291
+ "self": 0.0004930220020469278
292
  },
293
  "communicator.exchange": {
294
+ "total": 0.024494213997968473,
295
  "count": 1,
296
  "is_parallel": true,
297
+ "self": 0.024494213997968473
298
  },
299
  "steps_from_proto": {
300
+ "total": 0.0015997989976312965,
301
  "count": 2,
302
  "is_parallel": true,
303
+ "self": 0.00032821799686644226,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
+ "total": 0.0012715810007648543,
307
  "count": 8,
308
  "is_parallel": true,
309
+ "self": 0.0012715810007648543
310
  }
311
  }
312
  }
 
315
  }
316
  },
317
  "steps_from_proto": {
318
+ "total": 0.018047201985609718,
319
+ "count": 18,
320
  "is_parallel": true,
321
+ "self": 0.0030916809337213635,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
+ "total": 0.014955521051888354,
325
+ "count": 72,
326
  "is_parallel": true,
327
+ "self": 0.014955521051888354
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
+ "total": 4707.220596534637,
333
+ "count": 357130,
334
  "is_parallel": true,
335
+ "self": 257.41373912687413,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
+ "total": 162.74674167780904,
339
+ "count": 357130,
340
  "is_parallel": true,
341
+ "self": 162.74674167780904
342
  },
343
  "communicator.exchange": {
344
+ "total": 3645.2510425291694,
345
+ "count": 357130,
346
  "is_parallel": true,
347
+ "self": 3645.2510425291694
348
  },
349
  "steps_from_proto": {
350
+ "total": 641.809073200784,
351
+ "count": 714260,
352
  "is_parallel": true,
353
+ "self": 114.93468356617086,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
+ "total": 526.8743896346132,
357
+ "count": 2857040,
358
  "is_parallel": true,
359
+ "self": 526.8743896346132
360
  }
361
  }
362
  }
 
369
  }
370
  },
371
  "trainer_advance": {
372
+ "total": 7907.188229669249,
373
+ "count": 357131,
374
+ "self": 41.56422363645106,
375
  "children": {
376
  "process_trajectory": {
377
+ "total": 1667.4114032577781,
378
+ "count": 357131,
379
+ "self": 1666.2047581057705,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
+ "total": 1.2066451520076953,
383
+ "count": 10,
384
+ "self": 1.2066451520076953
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
+ "total": 6198.21260277502,
390
+ "count": 76,
391
+ "self": 967.3907746167824,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
+ "total": 5230.821828158238,
395
+ "count": 6080,
396
+ "self": 5230.821828158238
397
  }
398
  }
399
  }
 
402
  }
403
  },
404
  "trainer_threads": {
405
+ "total": 7.199996616691351e-07,
406
  "count": 1,
407
+ "self": 7.199996616691351e-07
408
  },
409
  "TrainerController._save_models": {
410
+ "total": 0.11839691399654839,
411
  "count": 1,
412
+ "self": 0.0024417589884251356,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
+ "total": 0.11595515500812326,
416
  "count": 1,
417
+ "self": 0.11595515500812326
418
  }
419
  }
420
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 8499978,
6
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1710349255.752344,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.pt"
11
  ]
12
  },
13
  {
14
- "steps": 8999988,
15
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1710350638.0742688,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.pt"
20
  ]
21
  },
22
  {
23
- "steps": 9499993,
24
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1710352100.153916,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.pt"
29
  ]
30
  },
31
  {
32
- "steps": 9999982,
33
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.onnx",
34
- "reward": null,
35
- "creation_time": 1710353568.109763,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.pt"
38
  ]
39
  },
40
  {
41
- "steps": 10000046,
42
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.onnx",
43
- "reward": null,
44
- "creation_time": 1710353568.2486105,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1607.9046472284606,
51
  "final_checkpoint": {
52
- "steps": 10000046,
53
  "file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
54
- "reward": null,
55
- "creation_time": 1710353568.2486105,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 13499994,
6
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-13499994.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1710368642.601263,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-13499994.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 13999986,
15
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-13999986.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1710370035.9879289,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-13999986.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 14499998,
24
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-14499998.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1710371506.4123518,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-14499998.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 14999982,
33
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-14999982.onnx",
34
+ "reward": 0.0,
35
+ "creation_time": 1710372965.343914,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-14999982.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 15000014,
42
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-15000014.onnx",
43
+ "reward": 0.0,
44
+ "creation_time": 1710372965.4699337,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-15000014.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1672.598696535884,
51
  "final_checkpoint": {
52
+ "steps": 15000014,
53
  "file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
54
+ "reward": 0.0,
55
+ "creation_time": 1710372965.4699337,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-15000014.pt"
58
  ]
59
  }
60
  },