tresbien1 committed on
Commit
b01519e
1 Parent(s): b52f016

Second, improved training of PyramidsRND with PPO

Browse files
Pyramids.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3395dfc05a3eb245da447c483971f7847b23dc78d8ba60e6d7e23333f993321b
3
  size 1420238
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315caf35221e6c229abfb8a3cfc48a204b94f96d74a66fc38239e889edaf8b48
3
  size 1420238
Pyramids/Pyramids-1000030.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315caf35221e6c229abfb8a3cfc48a204b94f96d74a66fc38239e889edaf8b48
3
+ size 1420238
Pyramids/Pyramids-1000030.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e4cf84038d7aa3c8c4ff3c4d787619b5ad1ee21fcb7f5bc69ee9d5f627c9ec
3
+ size 8656252
Pyramids/Pyramids-499955.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99372cfce9169c815d0dcea84c1271ac84cabbc467ad50c2372c7ebda3440d4
3
+ size 1420238
Pyramids/Pyramids-499955.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e1b1b490260e53933a76a213ce6bff1bbafdeb8d60ef616d32f812a6cd48a0a
3
+ size 8656173
Pyramids/Pyramids-999902.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315caf35221e6c229abfb8a3cfc48a204b94f96d74a66fc38239e889edaf8b48
3
+ size 1420238
Pyramids/Pyramids-999902.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e03c0ce1ef2f5038b555895acff7c989120c2ad0bd7b7edfaa51694e1eb89af
3
+ size 8656173
Pyramids/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:278a2e9d11e0f557d47c982fad4a0cc22ea05974cf9d1a1c3cd0d4f6152ac321
3
  size 8655778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb1e4ad310148fa1e31d0824d72b72f388888adb49ab4e5942dcfa7069c0c029
3
  size 8655778
Pyramids/events.out.tfevents.1704275893.a76fab4c855c.18344.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7c5baf706decfc6ea17208680fac0cb2716dd9c69354e37cd125e994f03252e
3
+ size 198670
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.95, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "rnd": {"gamma": 0.94, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 64, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 1000000, "time_horizon": 128, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/Pyramids/Pyramids", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Pyramids Training-2", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, 
"torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 64, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 1000000, "time_horizon": 128, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/Pyramids/Pyramids", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Pyramids Training-3", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, 
"torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -25,7 +25,7 @@ behaviors:
25
  deterministic: false
26
  reward_signals:
27
  extrinsic:
28
- gamma: 0.95
29
  strength: 1.0
30
  network_settings:
31
  normalize: false
@@ -36,7 +36,7 @@ behaviors:
36
  goal_conditioning_type: hyper
37
  deterministic: false
38
  rnd:
39
- gamma: 0.94
40
  strength: 0.01
41
  network_settings:
42
  normalize: false
@@ -79,7 +79,7 @@ engine_settings:
79
  no_graphics_monitor: false
80
  environment_parameters: null
81
  checkpoint_settings:
82
- run_id: Pyramids Training-2
83
  initialize_from: null
84
  load_model: false
85
  resume: false
 
25
  deterministic: false
26
  reward_signals:
27
  extrinsic:
28
+ gamma: 0.99
29
  strength: 1.0
30
  network_settings:
31
  normalize: false
 
36
  goal_conditioning_type: hyper
37
  deterministic: false
38
  rnd:
39
+ gamma: 0.99
40
  strength: 0.01
41
  network_settings:
42
  normalize: false
 
79
  no_graphics_monitor: false
80
  environment_parameters: null
81
  checkpoint_settings:
82
+ run_id: Pyramids Training-3
83
  initialize_from: null
84
  load_model: false
85
  resume: false
run_logs/Player-0.log CHANGED
@@ -1,7 +1,7 @@
1
  Mono path[0] = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/Managed'
2
  Mono config path = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/MonoBleedingEdge/etc'
3
  Found 1 interfaces on host : 0) 172.28.0.12
4
- Multi-casting "[IP] 172.28.0.12 [Port] 55334 [Flags] 2 [Guid] 1589326979 [EditorId] 764847374 [Version] 1048832 [Id] LinuxPlayer(13,172.28.0.12) [Debug] 0 [PackageName] LinuxPlayer [ProjectName] UnityEnvironment" to [225.0.0.222:54997]...
5
  Preloaded 'lib_burst_generated.so'
6
  Preloaded 'libgrpc_csharp_ext.x64.so'
7
  Initialize engine version: 2021.3.5f1 (40eb3a945986)
@@ -33,7 +33,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
33
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
34
  FMOD initialized on nosound output
35
  Begin MonoManager ReloadAssembly
36
- - Completed reload, in 0.192 seconds
37
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
38
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -65,7 +65,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
65
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
66
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
67
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
68
- UnloadTime: 1.130649 ms
69
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
70
  requesting resize 84 x 84
71
  Setting up 1 worker threads for Enlighten.
@@ -73,7 +73,7 @@ PlayerConnection::CleanupMemory Statistics:
73
  [ALLOC_TEMP_TLS] TLS Allocator
74
  StackAllocators :
75
  [ALLOC_TEMP_MAIN]
76
- Peak usage frame count: [16.0 KB-32.0 KB]: 7292 frames, [32.0 KB-64.0 KB]: 10155 frames, [64.0 KB-128.0 KB]: 1317 frames, [2.0 MB-4.0 MB]: 1 frames
77
  Initial Block Size 4.0 MB
78
  Current Block Size 4.0 MB
79
  Peak Allocated Bytes 2.0 MB
@@ -123,17 +123,17 @@ PlayerConnection::CleanupMemory Statistics:
123
  Current Block Size 64.0 KB
124
  Peak Allocated Bytes 0 B
125
  Overflow Count 0
126
- [ALLOC_TEMP_Background Job.Worker 15]
127
  Initial Block Size 32.0 KB
128
  Current Block Size 32.0 KB
129
  Peak Allocated Bytes 0 B
130
  Overflow Count 0
131
- [ALLOC_TEMP_Background Job.Worker 2]
132
  Initial Block Size 32.0 KB
133
  Current Block Size 32.0 KB
134
  Peak Allocated Bytes 0 B
135
  Overflow Count 0
136
- [ALLOC_TEMP_Background Job.Worker 7]
137
  Initial Block Size 32.0 KB
138
  Current Block Size 32.0 KB
139
  Peak Allocated Bytes 0 B
@@ -146,7 +146,7 @@ PlayerConnection::CleanupMemory Statistics:
146
  [ALLOC_TEMP_Profiler.Dispatcher]
147
  Initial Block Size 64.0 KB
148
  Current Block Size 64.0 KB
149
- Peak Allocated Bytes 240 B
150
  Overflow Count 0
151
  [ALLOC_TEMP_Background Job.Worker 12]
152
  Initial Block Size 32.0 KB
@@ -204,28 +204,28 @@ PlayerConnection::CleanupMemory Statistics:
204
  Peak Allocated Bytes 128 B
205
  Overflow Count 0
206
  [ALLOC_MEMORYPROFILER]
207
- Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18466 frames
208
  Requested Block Size 1.0 MB
209
  Peak Block count 2
210
  Peak Allocated memory 1.6 MB
211
  Peak Large allocation bytes 0 B
212
  [ALLOC_DEFAULT] Dual Thread Allocator
213
- Peak main deferred allocation count 11658
214
  [ALLOC_BUCKET]
215
  Large Block size 4.0 MB
216
  Used Block count 1
217
  Peak Allocated bytes 1.7 MB
218
  [ALLOC_DEFAULT_MAIN]
219
- Peak usage frame count: [8.0 MB-16.0 MB]: 1 frames, [16.0 MB-32.0 MB]: 18764 frames
220
  Requested Block Size 16.0 MB
221
  Peak Block count 3
222
- Peak Allocated memory 30.9 MB
223
  Peak Large allocation bytes 0 B
224
  [ALLOC_DEFAULT_THREAD]
225
- Peak usage frame count: [16.0 MB-32.0 MB]: 18765 frames
226
  Requested Block Size 16.0 MB
227
  Peak Block count 1
228
- Peak Allocated memory 23.6 MB
229
  Peak Large allocation bytes 16.0 MB
230
  [ALLOC_TEMP_JOB_1_FRAME]
231
  Initial Block Size 2.0 MB
@@ -254,13 +254,13 @@ PlayerConnection::CleanupMemory Statistics:
254
  Used Block count 1
255
  Peak Allocated bytes 1.7 MB
256
  [ALLOC_GFX_MAIN]
257
- Peak usage frame count: [32.0 KB-64.0 KB]: 18764 frames, [64.0 KB-128.0 KB]: 1 frames
258
  Requested Block Size 16.0 MB
259
  Peak Block count 1
260
  Peak Allocated memory 67.0 KB
261
  Peak Large allocation bytes 0 B
262
  [ALLOC_GFX_THREAD]
263
- Peak usage frame count: [64.0 KB-128.0 KB]: 18765 frames
264
  Requested Block Size 16.0 MB
265
  Peak Block count 1
266
  Peak Allocated memory 67.7 KB
@@ -272,16 +272,16 @@ PlayerConnection::CleanupMemory Statistics:
272
  Used Block count 1
273
  Peak Allocated bytes 1.7 MB
274
  [ALLOC_CACHEOBJECTS_MAIN]
275
- Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18466 frames
276
  Requested Block Size 4.0 MB
277
  Peak Block count 1
278
  Peak Allocated memory 1.4 MB
279
  Peak Large allocation bytes 0 B
280
  [ALLOC_CACHEOBJECTS_THREAD]
281
- Peak usage frame count: [1.0 MB-2.0 MB]: 18764 frames, [4.0 MB-8.0 MB]: 1 frames
282
  Requested Block Size 4.0 MB
283
  Peak Block count 2
284
- Peak Allocated memory 4.6 MB
285
  Peak Large allocation bytes 0 B
286
  [ALLOC_TYPETREE] Dual Thread Allocator
287
  Peak main deferred allocation count 0
@@ -290,25 +290,25 @@ PlayerConnection::CleanupMemory Statistics:
290
  Used Block count 1
291
  Peak Allocated bytes 1.7 MB
292
  [ALLOC_TYPETREE_MAIN]
293
- Peak usage frame count: [0-1.0 KB]: 18765 frames
294
  Requested Block Size 2.0 MB
295
  Peak Block count 1
296
  Peak Allocated memory 1.0 KB
297
  Peak Large allocation bytes 0 B
298
  [ALLOC_TYPETREE_THREAD]
299
- Peak usage frame count: [1.0 KB-2.0 KB]: 18765 frames
300
  Requested Block Size 2.0 MB
301
  Peak Block count 1
302
  Peak Allocated memory 1.9 KB
303
  Peak Large allocation bytes 0 B
304
  [ALLOC_PROFILER]
305
- Peak usage frame count: [16.0 KB-32.0 KB]: 18765 frames
306
  Requested Block Size 16.0 MB
307
  Peak Block count 1
308
- Peak Allocated memory 29.2 KB
309
  Peak Large allocation bytes 0 B
310
  [ALLOC_PROFILER_BUCKET]
311
  Large Block size 4.0 MB
312
  Used Block count 1
313
  Peak Allocated bytes 396 B
314
- ##utp:{"type":"MemoryLeaks","version":2,"phase":"Immediate","time":1704275352635,"processId":7898,"allocatedMemory":1970133,"memoryLabels":[{"Default":9033},{"Permanent":1264},{"NewDelete":12801},{"Thread":34460},{"Manager":10603},{"VertexData":12},{"Geometry":280},{"Texture":16},{"Shader":69173},{"Material":24},{"GfxDevice":35248},{"Animation":304},{"Audio":3976},{"Physics":288},{"Serialization":216},{"Input":9176},{"JobScheduler":200},{"Mono":40},{"ScriptingNativeRuntime":216},{"BaseObject":1609212},{"Resource":592},{"Renderer":1936},{"Transform":48},{"File":800},{"WebCam":24},{"Culling":40},{"Terrain":953},{"Wind":24},{"String":3447},{"DynamicArray":30868},{"HashMap":7680},{"Utility":1360},{"PoolAlloc":1160},{"TypeTree":1792},{"ScriptManager":80},{"RuntimeInitializeOnLoadManager":72},{"SpriteAtlas":112},{"GI":3272},{"Unet":16},{"Director":7760},{"WebRequest":720},{"VR":45473},{"SceneManager":424},{"Video":32},{"LazyScriptCache":32},{"NativeArray":384},{"Camera":25},{"Secure":1},{"SerializationCache":624},{"APIUpdating":5872},{"Subsystems":384},{"VirtualTexturing":57552},{"AssetReference":32}]}
 
1
  Mono path[0] = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/Managed'
2
  Mono config path = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/MonoBleedingEdge/etc'
3
  Found 1 interfaces on host : 0) 172.28.0.12
4
+ Multi-casting "[IP] 172.28.0.12 [Port] 55435 [Flags] 2 [Guid] 2233454501 [EditorId] 764847374 [Version] 1048832 [Id] LinuxPlayer(13,172.28.0.12) [Debug] 0 [PackageName] LinuxPlayer [ProjectName] UnityEnvironment" to [225.0.0.222:54997]...
5
  Preloaded 'lib_burst_generated.so'
6
  Preloaded 'libgrpc_csharp_ext.x64.so'
7
  Initialize engine version: 2021.3.5f1 (40eb3a945986)
 
33
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
34
  FMOD initialized on nosound output
35
  Begin MonoManager ReloadAssembly
36
+ - Completed reload, in 0.107 seconds
37
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
38
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
65
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
66
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
67
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
68
+ UnloadTime: 0.874010 ms
69
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
70
  requesting resize 84 x 84
71
  Setting up 1 worker threads for Enlighten.
 
73
  [ALLOC_TEMP_TLS] TLS Allocator
74
  StackAllocators :
75
  [ALLOC_TEMP_MAIN]
76
+ Peak usage frame count: [16.0 KB-32.0 KB]: 4076 frames, [32.0 KB-64.0 KB]: 12111 frames, [64.0 KB-128.0 KB]: 2578 frames, [2.0 MB-4.0 MB]: 1 frames
77
  Initial Block Size 4.0 MB
78
  Current Block Size 4.0 MB
79
  Peak Allocated Bytes 2.0 MB
 
123
  Current Block Size 64.0 KB
124
  Peak Allocated Bytes 0 B
125
  Overflow Count 0
126
+ [ALLOC_TEMP_Background Job.Worker 2]
127
  Initial Block Size 32.0 KB
128
  Current Block Size 32.0 KB
129
  Peak Allocated Bytes 0 B
130
  Overflow Count 0
131
+ [ALLOC_TEMP_Background Job.Worker 7]
132
  Initial Block Size 32.0 KB
133
  Current Block Size 32.0 KB
134
  Peak Allocated Bytes 0 B
135
  Overflow Count 0
136
+ [ALLOC_TEMP_Background Job.Worker 15]
137
  Initial Block Size 32.0 KB
138
  Current Block Size 32.0 KB
139
  Peak Allocated Bytes 0 B
 
146
  [ALLOC_TEMP_Profiler.Dispatcher]
147
  Initial Block Size 64.0 KB
148
  Current Block Size 64.0 KB
149
+ Peak Allocated Bytes 480 B
150
  Overflow Count 0
151
  [ALLOC_TEMP_Background Job.Worker 12]
152
  Initial Block Size 32.0 KB
 
204
  Peak Allocated Bytes 128 B
205
  Overflow Count 0
206
  [ALLOC_MEMORYPROFILER]
207
+ Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18467 frames
208
  Requested Block Size 1.0 MB
209
  Peak Block count 2
210
  Peak Allocated memory 1.6 MB
211
  Peak Large allocation bytes 0 B
212
  [ALLOC_DEFAULT] Dual Thread Allocator
213
+ Peak main deferred allocation count 13249
214
  [ALLOC_BUCKET]
215
  Large Block size 4.0 MB
216
  Used Block count 1
217
  Peak Allocated bytes 1.7 MB
218
  [ALLOC_DEFAULT_MAIN]
219
+ Peak usage frame count: [8.0 MB-16.0 MB]: 1 frames, [16.0 MB-32.0 MB]: 18765 frames
220
  Requested Block Size 16.0 MB
221
  Peak Block count 3
222
+ Peak Allocated memory 31.3 MB
223
  Peak Large allocation bytes 0 B
224
  [ALLOC_DEFAULT_THREAD]
225
+ Peak usage frame count: [16.0 MB-32.0 MB]: 18766 frames
226
  Requested Block Size 16.0 MB
227
  Peak Block count 1
228
+ Peak Allocated memory 22.3 MB
229
  Peak Large allocation bytes 16.0 MB
230
  [ALLOC_TEMP_JOB_1_FRAME]
231
  Initial Block Size 2.0 MB
 
254
  Used Block count 1
255
  Peak Allocated bytes 1.7 MB
256
  [ALLOC_GFX_MAIN]
257
+ Peak usage frame count: [32.0 KB-64.0 KB]: 18765 frames, [64.0 KB-128.0 KB]: 1 frames
258
  Requested Block Size 16.0 MB
259
  Peak Block count 1
260
  Peak Allocated memory 67.0 KB
261
  Peak Large allocation bytes 0 B
262
  [ALLOC_GFX_THREAD]
263
+ Peak usage frame count: [64.0 KB-128.0 KB]: 18766 frames
264
  Requested Block Size 16.0 MB
265
  Peak Block count 1
266
  Peak Allocated memory 67.7 KB
 
272
  Used Block count 1
273
  Peak Allocated bytes 1.7 MB
274
  [ALLOC_CACHEOBJECTS_MAIN]
275
+ Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18467 frames
276
  Requested Block Size 4.0 MB
277
  Peak Block count 1
278
  Peak Allocated memory 1.4 MB
279
  Peak Large allocation bytes 0 B
280
  [ALLOC_CACHEOBJECTS_THREAD]
281
+ Peak usage frame count: [1.0 MB-2.0 MB]: 18765 frames, [4.0 MB-8.0 MB]: 1 frames
282
  Requested Block Size 4.0 MB
283
  Peak Block count 2
284
+ Peak Allocated memory 4.7 MB
285
  Peak Large allocation bytes 0 B
286
  [ALLOC_TYPETREE] Dual Thread Allocator
287
  Peak main deferred allocation count 0
 
290
  Used Block count 1
291
  Peak Allocated bytes 1.7 MB
292
  [ALLOC_TYPETREE_MAIN]
293
+ Peak usage frame count: [0-1.0 KB]: 18766 frames
294
  Requested Block Size 2.0 MB
295
  Peak Block count 1
296
  Peak Allocated memory 1.0 KB
297
  Peak Large allocation bytes 0 B
298
  [ALLOC_TYPETREE_THREAD]
299
+ Peak usage frame count: [1.0 KB-2.0 KB]: 18766 frames
300
  Requested Block Size 2.0 MB
301
  Peak Block count 1
302
  Peak Allocated memory 1.9 KB
303
  Peak Large allocation bytes 0 B
304
  [ALLOC_PROFILER]
305
+ Peak usage frame count: [16.0 KB-32.0 KB]: 18766 frames
306
  Requested Block Size 16.0 MB
307
  Peak Block count 1
308
+ Peak Allocated memory 29.1 KB
309
  Peak Large allocation bytes 0 B
310
  [ALLOC_PROFILER_BUCKET]
311
  Large Block size 4.0 MB
312
  Used Block count 1
313
  Peak Allocated bytes 396 B
314
+ ##utp:{"type":"MemoryLeaks","version":2,"phase":"Immediate","time":1704278030062,"processId":18361,"allocatedMemory":1970133,"memoryLabels":[{"Default":9033},{"Permanent":1264},{"NewDelete":12801},{"Thread":34460},{"Manager":10603},{"VertexData":12},{"Geometry":280},{"Texture":16},{"Shader":69173},{"Material":24},{"GfxDevice":35248},{"Animation":304},{"Audio":3976},{"Physics":288},{"Serialization":216},{"Input":9176},{"JobScheduler":200},{"Mono":40},{"ScriptingNativeRuntime":216},{"BaseObject":1609212},{"Resource":592},{"Renderer":1936},{"Transform":48},{"File":800},{"WebCam":24},{"Culling":40},{"Terrain":953},{"Wind":24},{"String":3447},{"DynamicArray":30868},{"HashMap":7680},{"Utility":1360},{"PoolAlloc":1160},{"TypeTree":1792},{"ScriptManager":80},{"RuntimeInitializeOnLoadManager":72},{"SpriteAtlas":112},{"GI":3272},{"Unet":16},{"Director":7760},{"WebRequest":720},{"VR":45473},{"SceneManager":424},{"Video":32},{"LazyScriptCache":32},{"NativeArray":384},{"Camera":25},{"Secure":1},{"SerializationCache":624},{"APIUpdating":5872},{"Subsystems":384},{"VirtualTexturing":57552},{"AssetReference":32}]}
run_logs/timers.json CHANGED
@@ -2,171 +2,171 @@
2
  "name": "root",
3
  "gauges": {
4
  "Pyramids.Policy.Entropy.mean": {
5
- "value": 0.5983927845954895,
6
- "min": 0.5983927845954895,
7
- "max": 1.343400001525879,
8
  "count": 20
9
  },
10
  "Pyramids.Policy.Entropy.sum": {
11
- "value": 29986.66015625,
12
- "min": 29986.66015625,
13
- "max": 67234.484375,
14
  "count": 20
15
  },
16
  "Pyramids.Step.mean": {
17
- "value": 999925.0,
18
- "min": 49878.0,
19
- "max": 999925.0,
20
  "count": 20
21
  },
22
  "Pyramids.Step.sum": {
23
- "value": 999925.0,
24
- "min": 49878.0,
25
- "max": 999925.0,
26
  "count": 20
27
  },
28
  "Pyramids.Policy.ExtrinsicValueEstimate.mean": {
29
- "value": -0.013876122422516346,
30
- "min": -0.030839893966913223,
31
- "max": -0.00945535209029913,
32
  "count": 20
33
  },
34
  "Pyramids.Policy.ExtrinsicValueEstimate.sum": {
35
- "value": -5.5782012939453125,
36
- "min": -12.3051176071167,
37
- "max": -3.81050705909729,
38
  "count": 20
39
  },
40
  "Pyramids.Policy.RndValueEstimate.mean": {
41
- "value": 0.0029050002340227365,
42
- "min": -0.00022533306037075818,
43
- "max": 0.08890791237354279,
44
  "count": 20
45
  },
46
  "Pyramids.Policy.RndValueEstimate.sum": {
47
- "value": 1.167810082435608,
48
- "min": -0.09035855531692505,
49
- "max": 35.47425842285156,
50
  "count": 20
51
  },
52
  "Pyramids.Losses.PolicyLoss.mean": {
53
- "value": 0.06579226099424805,
54
- "min": 0.06512104197606153,
55
- "max": 0.07199981855150664,
56
  "count": 20
57
  },
58
  "Pyramids.Losses.PolicyLoss.sum": {
59
- "value": 1.513222002867705,
60
- "min": 0.8930364629323959,
61
- "max": 1.6477607740883151,
62
  "count": 20
63
  },
64
  "Pyramids.Losses.ValueLoss.mean": {
65
- "value": 0.0009892530458551413,
66
- "min": 0.0001602431029824168,
67
- "max": 0.0037391359524955254,
68
  "count": 20
69
  },
70
  "Pyramids.Losses.ValueLoss.sum": {
71
- "value": 0.02275282005466825,
72
- "min": 0.0035253482656131697,
73
- "max": 0.04860876738244183,
74
  "count": 20
75
  },
76
  "Pyramids.Policy.LearningRate.mean": {
77
- "value": 7.53210618498261e-06,
78
- "min": 7.53210618498261e-06,
79
- "max": 0.0002917810642781077,
80
  "count": 20
81
  },
82
  "Pyramids.Policy.LearningRate.sum": {
83
- "value": 0.00017323844225460003,
84
- "min": 0.00017323844225460003,
85
- "max": 0.005768409877196799,
86
  "count": 20
87
  },
88
  "Pyramids.Policy.Epsilon.mean": {
89
- "value": 0.1025106695652174,
90
- "min": 0.1025106695652174,
91
- "max": 0.19726035384615387,
92
  "count": 20
93
  },
94
  "Pyramids.Policy.Epsilon.sum": {
95
- "value": 2.3577454,
96
- "min": 2.3577454,
97
- "max": 4.1228032,
98
  "count": 20
99
  },
100
  "Pyramids.Policy.Beta.mean": {
101
- "value": 0.00026081588956521746,
102
- "min": 0.00026081588956521746,
103
- "max": 0.00972630934923077,
104
  "count": 20
105
  },
106
  "Pyramids.Policy.Beta.sum": {
107
- "value": 0.005998765460000001,
108
- "min": 0.005998765460000001,
109
- "max": 0.19230803968000001,
110
  "count": 20
111
  },
112
  "Pyramids.Losses.RNDLoss.mean": {
113
- "value": 0.01551153976470232,
114
- "min": 0.01551153976470232,
115
- "max": 0.3107236623764038,
116
  "count": 20
117
  },
118
  "Pyramids.Losses.RNDLoss.sum": {
119
- "value": 0.35676541924476624,
120
- "min": 0.35676541924476624,
121
- "max": 4.039407730102539,
122
  "count": 20
123
  },
124
  "Pyramids.Environment.EpisodeLength.mean": {
125
- "value": 972.5098039215686,
126
- "min": 946.2692307692307,
127
- "max": 996.0416666666666,
128
  "count": 20
129
  },
130
  "Pyramids.Environment.EpisodeLength.sum": {
131
- "value": 49598.0,
132
- "min": 47237.0,
133
- "max": 56043.0,
134
  "count": 20
135
  },
136
  "Pyramids.Environment.CumulativeReward.mean": {
137
- "value": -0.7378627939843664,
138
- "min": -0.9552083844318986,
139
- "max": -0.6432923601510433,
140
  "count": 20
141
  },
142
  "Pyramids.Environment.CumulativeReward.sum": {
143
- "value": -37.631002493202686,
144
- "min": -50.088402941823006,
145
- "max": -33.45120272785425,
146
  "count": 20
147
  },
148
  "Pyramids.Policy.ExtrinsicReward.mean": {
149
- "value": -0.7378627939843664,
150
- "min": -0.9552083844318986,
151
- "max": -0.6432923601510433,
152
  "count": 20
153
  },
154
  "Pyramids.Policy.ExtrinsicReward.sum": {
155
- "value": -37.631002493202686,
156
- "min": -50.088402941823006,
157
- "max": -33.45120272785425,
158
  "count": 20
159
  },
160
  "Pyramids.Policy.RndReward.mean": {
161
- "value": 0.15703592533428296,
162
- "min": 0.15624511372656202,
163
- "max": 4.615633514864991,
164
  "count": 20
165
  },
166
  "Pyramids.Policy.RndReward.sum": {
167
- "value": 8.00883219204843,
168
- "min": 8.00883219204843,
169
- "max": 221.55040871351957,
170
  "count": 20
171
  },
172
  "Pyramids.IsTraining.mean": {
@@ -184,67 +184,67 @@
184
  },
185
  "metadata": {
186
  "timer_format_version": "0.1.0",
187
- "start_time_seconds": "1704273359",
188
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
189
- "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training-2 --no-graphics",
190
  "mlagents_version": "1.1.0.dev0",
191
  "mlagents_envs_version": "1.1.0.dev0",
192
  "communication_protocol_version": "1.5.0",
193
  "pytorch_version": "2.1.2+cu121",
194
  "numpy_version": "1.23.5",
195
- "end_time_seconds": "1704275352"
196
  },
197
- "total": 1993.154926618,
198
  "count": 1,
199
- "self": 0.48554877099991245,
200
  "children": {
201
  "run_training.setup": {
202
- "total": 0.06937176099995668,
203
  "count": 1,
204
- "self": 0.06937176099995668
205
  },
206
  "TrainerController.start_learning": {
207
- "total": 1992.6000060860001,
208
  "count": 1,
209
- "self": 1.4480502969940972,
210
  "children": {
211
  "TrainerController._reset_env": {
212
- "total": 2.673110766000036,
213
  "count": 1,
214
- "self": 2.673110766000036
215
  },
216
  "TrainerController.advance": {
217
- "total": 1988.394409740006,
218
- "count": 63030,
219
- "self": 1.4689806919566308,
220
  "children": {
221
  "env_step": {
222
- "total": 1358.9817631640058,
223
- "count": 63030,
224
- "self": 1225.942064266986,
225
  "children": {
226
  "SubprocessEnvManager._take_step": {
227
- "total": 132.17192505101366,
228
- "count": 63030,
229
- "self": 4.719373328042593,
230
  "children": {
231
  "TorchPolicy.evaluate": {
232
- "total": 127.45255172297107,
233
- "count": 62550,
234
- "self": 127.45255172297107
235
  }
236
  }
237
  },
238
  "workers": {
239
- "total": 0.8677738460060027,
240
- "count": 63030,
241
  "self": 0.0,
242
  "children": {
243
  "worker_root": {
244
- "total": 1987.4621567540394,
245
- "count": 63030,
246
  "is_parallel": true,
247
- "self": 880.5503308880463,
248
  "children": {
249
  "run_training.setup": {
250
  "total": 0.0,
@@ -253,48 +253,48 @@
253
  "self": 0.0,
254
  "children": {
255
  "steps_from_proto": {
256
- "total": 0.0022598160001052747,
257
  "count": 1,
258
  "is_parallel": true,
259
- "self": 0.0005843530000220198,
260
  "children": {
261
  "_process_rank_one_or_two_observation": {
262
- "total": 0.0016754630000832549,
263
  "count": 8,
264
  "is_parallel": true,
265
- "self": 0.0016754630000832549
266
  }
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
- "total": 0.05077610300008928,
271
  "count": 1,
272
  "is_parallel": true,
273
- "self": 0.0006098310000197671,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
- "total": 0.00048121800000444637,
277
  "count": 1,
278
  "is_parallel": true,
279
- "self": 0.00048121800000444637
280
  },
281
  "communicator.exchange": {
282
- "total": 0.047941176999984236,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.047941176999984236
286
  },
287
  "steps_from_proto": {
288
- "total": 0.001743877000080829,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.00037161100021876337,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
- "total": 0.0013722659998620657,
295
  "count": 8,
296
  "is_parallel": true,
297
- "self": 0.0013722659998620657
298
  }
299
  }
300
  }
@@ -303,34 +303,34 @@
303
  }
304
  },
305
  "UnityEnvironment.step": {
306
- "total": 1106.911825865993,
307
- "count": 63029,
308
  "is_parallel": true,
309
- "self": 34.95583143394447,
310
  "children": {
311
  "UnityEnvironment._generate_step_input": {
312
- "total": 24.578581023000424,
313
- "count": 63029,
314
  "is_parallel": true,
315
- "self": 24.578581023000424
316
  },
317
  "communicator.exchange": {
318
- "total": 948.7428121660562,
319
- "count": 63029,
320
  "is_parallel": true,
321
- "self": 948.7428121660562
322
  },
323
  "steps_from_proto": {
324
- "total": 98.63460124299195,
325
- "count": 63029,
326
  "is_parallel": true,
327
- "self": 19.71788833404821,
328
  "children": {
329
  "_process_rank_one_or_two_observation": {
330
- "total": 78.91671290894374,
331
- "count": 504232,
332
  "is_parallel": true,
333
- "self": 78.91671290894374
334
  }
335
  }
336
  }
@@ -343,31 +343,31 @@
343
  }
344
  },
345
  "trainer_advance": {
346
- "total": 627.9436658840436,
347
- "count": 63030,
348
- "self": 2.6710124700555298,
349
  "children": {
350
  "process_trajectory": {
351
- "total": 124.30694764398822,
352
- "count": 63030,
353
- "self": 124.06981375898795,
354
  "children": {
355
  "RLTrainer._checkpoint": {
356
- "total": 0.23713388500027577,
357
  "count": 2,
358
- "self": 0.23713388500027577
359
  }
360
  }
361
  },
362
  "_update_policy": {
363
- "total": 500.9657057699999,
364
- "count": 442,
365
- "self": 298.7058735060057,
366
  "children": {
367
  "TorchPPOOptimizer.update": {
368
- "total": 202.2598322639942,
369
- "count": 22710,
370
- "self": 202.2598322639942
371
  }
372
  }
373
  }
@@ -376,19 +376,19 @@
376
  }
377
  },
378
  "trainer_threads": {
379
- "total": 8.469996828353032e-07,
380
  "count": 1,
381
- "self": 8.469996828353032e-07
382
  },
383
  "TrainerController._save_models": {
384
- "total": 0.08443443600026512,
385
  "count": 1,
386
- "self": 0.001465669000026537,
387
  "children": {
388
  "RLTrainer._checkpoint": {
389
- "total": 0.08296876700023859,
390
  "count": 1,
391
- "self": 0.08296876700023859
392
  }
393
  }
394
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "Pyramids.Policy.Entropy.mean": {
5
+ "value": 0.40660443902015686,
6
+ "min": 0.3838774263858795,
7
+ "max": 1.3838720321655273,
8
  "count": 20
9
  },
10
  "Pyramids.Policy.Entropy.sum": {
11
+ "value": 20323.716796875,
12
+ "min": 19058.74609375,
13
+ "max": 70632.828125,
14
  "count": 20
15
  },
16
  "Pyramids.Step.mean": {
17
+ "value": 999902.0,
18
+ "min": 49982.0,
19
+ "max": 999902.0,
20
  "count": 20
21
  },
22
  "Pyramids.Step.sum": {
23
+ "value": 999902.0,
24
+ "min": 49982.0,
25
+ "max": 999902.0,
26
  "count": 20
27
  },
28
  "Pyramids.Policy.ExtrinsicValueEstimate.mean": {
29
+ "value": 0.5106868147850037,
30
+ "min": -0.10902372002601624,
31
+ "max": 0.5106868147850037,
32
  "count": 20
33
  },
34
  "Pyramids.Policy.ExtrinsicValueEstimate.sum": {
35
+ "value": 230.8304443359375,
36
+ "min": -43.60948944091797,
37
+ "max": 230.8304443359375,
38
  "count": 20
39
  },
40
  "Pyramids.Policy.RndValueEstimate.mean": {
41
+ "value": 0.018002863973379135,
42
+ "min": 0.017526134848594666,
43
+ "max": 0.27170729637145996,
44
  "count": 20
45
  },
46
  "Pyramids.Policy.RndValueEstimate.sum": {
47
+ "value": 8.13729476928711,
48
+ "min": 7.298983573913574,
49
+ "max": 108.68292236328125,
50
  "count": 20
51
  },
52
  "Pyramids.Losses.PolicyLoss.mean": {
53
+ "value": 0.0690960958714177,
54
+ "min": 0.06685300014880363,
55
+ "max": 0.07348646662135302,
56
  "count": 20
57
  },
58
  "Pyramids.Losses.PolicyLoss.sum": {
59
+ "value": 1.6583063009140246,
60
+ "min": 1.0288105326989423,
61
+ "max": 1.7034627192473386,
62
  "count": 20
63
  },
64
  "Pyramids.Losses.ValueLoss.mean": {
65
+ "value": 0.015689400035530914,
66
+ "min": 0.0004058652203409273,
67
+ "max": 0.017001819814943114,
68
  "count": 20
69
  },
70
  "Pyramids.Losses.ValueLoss.sum": {
71
+ "value": 0.3765456008527419,
72
+ "min": 0.008697785586991082,
73
+ "max": 0.40804367555863474,
74
  "count": 20
75
  },
76
  "Pyramids.Policy.LearningRate.mean": {
77
+ "value": 7.360097546666664e-06,
78
+ "min": 7.360097546666664e-06,
79
+ "max": 0.00029159310280229997,
80
  "count": 20
81
  },
82
  "Pyramids.Policy.LearningRate.sum": {
83
+ "value": 0.00017664234111999994,
84
+ "min": 0.00017664234111999994,
85
+ "max": 0.0054513657828781995,
86
  "count": 20
87
  },
88
  "Pyramids.Policy.Epsilon.mean": {
89
+ "value": 0.10245333333333334,
90
+ "min": 0.10245333333333334,
91
+ "max": 0.1971977,
92
  "count": 20
93
  },
94
  "Pyramids.Policy.Epsilon.sum": {
95
+ "value": 2.45888,
96
+ "min": 2.45888,
97
+ "max": 4.0171218,
98
  "count": 20
99
  },
100
  "Pyramids.Policy.Beta.mean": {
101
+ "value": 0.00025508799999999994,
102
+ "min": 0.00025508799999999994,
103
+ "max": 0.00972005023,
104
  "count": 20
105
  },
106
  "Pyramids.Policy.Beta.sum": {
107
+ "value": 0.006122111999999999,
108
+ "min": 0.006122111999999999,
109
+ "max": 0.18175046781999998,
110
  "count": 20
111
  },
112
  "Pyramids.Losses.RNDLoss.mean": {
113
+ "value": 0.015770716592669487,
114
+ "min": 0.015770716592669487,
115
+ "max": 0.37413766980171204,
116
  "count": 20
117
  },
118
  "Pyramids.Losses.RNDLoss.sum": {
119
+ "value": 0.3784972131252289,
120
+ "min": 0.3784972131252289,
121
+ "max": 5.237927436828613,
122
  "count": 20
123
  },
124
  "Pyramids.Environment.EpisodeLength.mean": {
125
+ "value": 355.95620437956205,
126
+ "min": 355.95620437956205,
127
+ "max": 999.0,
128
  "count": 20
129
  },
130
  "Pyramids.Environment.EpisodeLength.sum": {
131
+ "value": 48766.0,
132
+ "min": 47053.0,
133
+ "max": 52985.0,
134
  "count": 20
135
  },
136
  "Pyramids.Environment.CumulativeReward.mean": {
137
+ "value": 1.5564291726281172,
138
+ "min": -1.0000000521540642,
139
+ "max": 1.5564291726281172,
140
  "count": 20
141
  },
142
  "Pyramids.Environment.CumulativeReward.sum": {
143
+ "value": 213.23079665005207,
144
+ "min": -48.00000250339508,
145
+ "max": 213.23079665005207,
146
  "count": 20
147
  },
148
  "Pyramids.Policy.ExtrinsicReward.mean": {
149
+ "value": 1.5564291726281172,
150
+ "min": -1.0000000521540642,
151
+ "max": 1.5564291726281172,
152
  "count": 20
153
  },
154
  "Pyramids.Policy.ExtrinsicReward.sum": {
155
+ "value": 213.23079665005207,
156
+ "min": -48.00000250339508,
157
+ "max": 213.23079665005207,
158
  "count": 20
159
  },
160
  "Pyramids.Policy.RndReward.mean": {
161
+ "value": 0.057838770586890624,
162
+ "min": 0.057838770586890624,
163
+ "max": 5.367142829267929,
164
  "count": 20
165
  },
166
  "Pyramids.Policy.RndReward.sum": {
167
+ "value": 7.923911570404016,
168
+ "min": 7.923911570404016,
169
+ "max": 257.6228558048606,
170
  "count": 20
171
  },
172
  "Pyramids.IsTraining.mean": {
 
184
  },
185
  "metadata": {
186
  "timer_format_version": "0.1.0",
187
+ "start_time_seconds": "1704275892",
188
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
189
+ "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training-3 --no-graphics",
190
  "mlagents_version": "1.1.0.dev0",
191
  "mlagents_envs_version": "1.1.0.dev0",
192
  "communication_protocol_version": "1.5.0",
193
  "pytorch_version": "2.1.2+cu121",
194
  "numpy_version": "1.23.5",
195
+ "end_time_seconds": "1704278030"
196
  },
197
+ "total": 2138.0222330259994,
198
  "count": 1,
199
+ "self": 0.9853462019991639,
200
  "children": {
201
  "run_training.setup": {
202
+ "total": 0.04736289700031193,
203
  "count": 1,
204
+ "self": 0.04736289700031193
205
  },
206
  "TrainerController.start_learning": {
207
+ "total": 2136.989523927,
208
  "count": 1,
209
+ "self": 1.458595546028846,
210
  "children": {
211
  "TrainerController._reset_env": {
212
+ "total": 2.147141593000015,
213
  "count": 1,
214
+ "self": 2.147141593000015
215
  },
216
  "TrainerController.advance": {
217
+ "total": 2133.255490715972,
218
+ "count": 63628,
219
+ "self": 1.5977552797594399,
220
  "children": {
221
  "env_step": {
222
+ "total": 1490.3827759572332,
223
+ "count": 63628,
224
+ "self": 1354.185206475171,
225
  "children": {
226
  "SubprocessEnvManager._take_step": {
227
+ "total": 135.26424939209664,
228
+ "count": 63628,
229
+ "self": 4.834128640190102,
230
  "children": {
231
  "TorchPolicy.evaluate": {
232
+ "total": 130.43012075190654,
233
+ "count": 62551,
234
+ "self": 130.43012075190654
235
  }
236
  }
237
  },
238
  "workers": {
239
+ "total": 0.9333200899654912,
240
+ "count": 63628,
241
  "self": 0.0,
242
  "children": {
243
  "worker_root": {
244
+ "total": 2131.672288137017,
245
+ "count": 63628,
246
  "is_parallel": true,
247
+ "self": 900.1139222690681,
248
  "children": {
249
  "run_training.setup": {
250
  "total": 0.0,
 
253
  "self": 0.0,
254
  "children": {
255
  "steps_from_proto": {
256
+ "total": 0.0017603739997866796,
257
  "count": 1,
258
  "is_parallel": true,
259
+ "self": 0.0005314810023264727,
260
  "children": {
261
  "_process_rank_one_or_two_observation": {
262
+ "total": 0.001228892997460207,
263
  "count": 8,
264
  "is_parallel": true,
265
+ "self": 0.001228892997460207
266
  }
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
+ "total": 0.04862397000033525,
271
  "count": 1,
272
  "is_parallel": true,
273
+ "self": 0.0005931800005782861,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
+ "total": 0.0004881089998889365,
277
  "count": 1,
278
  "is_parallel": true,
279
+ "self": 0.0004881089998889365
280
  },
281
  "communicator.exchange": {
282
+ "total": 0.04590963299961004,
283
  "count": 1,
284
  "is_parallel": true,
285
+ "self": 0.04590963299961004
286
  },
287
  "steps_from_proto": {
288
+ "total": 0.0016330480002579861,
289
  "count": 1,
290
  "is_parallel": true,
291
+ "self": 0.00035718700019060634,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
+ "total": 0.0012758610000673798,
295
  "count": 8,
296
  "is_parallel": true,
297
+ "self": 0.0012758610000673798
298
  }
299
  }
300
  }
 
303
  }
304
  },
305
  "UnityEnvironment.step": {
306
+ "total": 1231.5583658679489,
307
+ "count": 63627,
308
  "is_parallel": true,
309
+ "self": 34.945650922931236,
310
  "children": {
311
  "UnityEnvironment._generate_step_input": {
312
+ "total": 24.486377486137826,
313
+ "count": 63627,
314
  "is_parallel": true,
315
+ "self": 24.486377486137826
316
  },
317
  "communicator.exchange": {
318
+ "total": 1073.1361114249412,
319
+ "count": 63627,
320
  "is_parallel": true,
321
+ "self": 1073.1361114249412
322
  },
323
  "steps_from_proto": {
324
+ "total": 98.9902260339386,
325
+ "count": 63627,
326
  "is_parallel": true,
327
+ "self": 20.087128791734358,
328
  "children": {
329
  "_process_rank_one_or_two_observation": {
330
+ "total": 78.90309724220424,
331
+ "count": 509016,
332
  "is_parallel": true,
333
+ "self": 78.90309724220424
334
  }
335
  }
336
  }
 
343
  }
344
  },
345
  "trainer_advance": {
346
+ "total": 641.2749594789793,
347
+ "count": 63628,
348
+ "self": 2.883373502001632,
349
  "children": {
350
  "process_trajectory": {
351
+ "total": 128.47727592296815,
352
+ "count": 63628,
353
+ "self": 128.2043659059682,
354
  "children": {
355
  "RLTrainer._checkpoint": {
356
+ "total": 0.2729100169999583,
357
  "count": 2,
358
+ "self": 0.2729100169999583
359
  }
360
  }
361
  },
362
  "_update_policy": {
363
+ "total": 509.91431005400955,
364
+ "count": 447,
365
+ "self": 302.8242494070273,
366
  "children": {
367
  "TorchPPOOptimizer.update": {
368
+ "total": 207.09006064698224,
369
+ "count": 22893,
370
+ "self": 207.09006064698224
371
  }
372
  }
373
  }
 
376
  }
377
  },
378
  "trainer_threads": {
379
+ "total": 1.2289992810110562e-06,
380
  "count": 1,
381
+ "self": 1.2289992810110562e-06
382
  },
383
  "TrainerController._save_models": {
384
+ "total": 0.1282948429998214,
385
  "count": 1,
386
+ "self": 0.002003808999688772,
387
  "children": {
388
  "RLTrainer._checkpoint": {
389
+ "total": 0.12629103400013264,
390
  "count": 1,
391
+ "self": 0.12629103400013264
392
  }
393
  }
394
  }
run_logs/training_status.json CHANGED
@@ -2,40 +2,40 @@
2
  "Pyramids": {
3
  "checkpoints": [
4
  {
5
- "steps": 499925,
6
- "file_path": "results/Pyramids Training-2/Pyramids/Pyramids-499925.onnx",
7
- "reward": -0.9996000528335571,
8
- "creation_time": 1704274353.265112,
9
  "auxillary_file_paths": [
10
- "results/Pyramids Training-2/Pyramids/Pyramids-499925.pt"
11
  ]
12
  },
13
  {
14
- "steps": 999925,
15
- "file_path": "results/Pyramids Training-2/Pyramids/Pyramids-999925.onnx",
16
- "reward": 0.16050000116229057,
17
- "creation_time": 1704275352.109694,
18
  "auxillary_file_paths": [
19
- "results/Pyramids Training-2/Pyramids/Pyramids-999925.pt"
20
  ]
21
  },
22
  {
23
- "steps": 1000053,
24
- "file_path": "results/Pyramids Training-2/Pyramids/Pyramids-1000053.onnx",
25
- "reward": 0.16050000116229057,
26
- "creation_time": 1704275352.2048194,
27
  "auxillary_file_paths": [
28
- "results/Pyramids Training-2/Pyramids/Pyramids-1000053.pt"
29
  ]
30
  }
31
  ],
32
  "final_checkpoint": {
33
- "steps": 1000053,
34
- "file_path": "results/Pyramids Training-2/Pyramids.onnx",
35
- "reward": 0.16050000116229057,
36
- "creation_time": 1704275352.2048194,
37
  "auxillary_file_paths": [
38
- "results/Pyramids Training-2/Pyramids/Pyramids-1000053.pt"
39
  ]
40
  }
41
  },
 
2
  "Pyramids": {
3
  "checkpoints": [
4
  {
5
+ "steps": 499955,
6
+ "file_path": "results/Pyramids Training-3/Pyramids/Pyramids-499955.onnx",
7
+ "reward": null,
8
+ "creation_time": 1704276891.3628292,
9
  "auxillary_file_paths": [
10
+ "results/Pyramids Training-3/Pyramids/Pyramids-499955.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 999902,
15
+ "file_path": "results/Pyramids Training-3/Pyramids/Pyramids-999902.onnx",
16
+ "reward": null,
17
+ "creation_time": 1704278029.0157154,
18
  "auxillary_file_paths": [
19
+ "results/Pyramids Training-3/Pyramids/Pyramids-999902.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 1000030,
24
+ "file_path": "results/Pyramids Training-3/Pyramids/Pyramids-1000030.onnx",
25
+ "reward": null,
26
+ "creation_time": 1704278029.1617928,
27
  "auxillary_file_paths": [
28
+ "results/Pyramids Training-3/Pyramids/Pyramids-1000030.pt"
29
  ]
30
  }
31
  ],
32
  "final_checkpoint": {
33
+ "steps": 1000030,
34
+ "file_path": "results/Pyramids Training-3/Pyramids.onnx",
35
+ "reward": null,
36
+ "creation_time": 1704278029.1617928,
37
  "auxillary_file_paths": [
38
+ "results/Pyramids Training-3/Pyramids/Pyramids-1000030.pt"
39
  ]
40
  }
41
  },