mihirdeo16
commited on
Commit
•
01297fc
1
Parent(s):
b99aa84
Upload . with huggingface_hub
Browse files- .summary/0/events.out.tfevents.1687392329.mihirs-MacBook-Air.local +3 -0
- README.md +1 -1
- checkpoint_p0/checkpoint_000001637_6114688.pth +3 -0
- config.json +1 -1
- replay.mp4 +2 -2
- sf_log.txt +604 -0
.summary/0/events.out.tfevents.1687392329.mihirs-MacBook-Air.local
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f63543400f815854cc7a6521374edd91dab94363ee912e21a1392754f1c78c7
|
3 |
+
size 2343
|
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value:
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 10.73 +/- 4.77
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
checkpoint_p0/checkpoint_000001637_6114688.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be770681681e0c1fcaac55e5c7ff45fedb6b1d68448575fa6db8e99885d52c30
|
3 |
+
size 34928851
|
config.json
CHANGED
@@ -65,7 +65,7 @@
|
|
65 |
"summaries_use_frameskip": true,
|
66 |
"heartbeat_interval": 20,
|
67 |
"heartbeat_reporting_interval": 600,
|
68 |
-
"train_for_env_steps":
|
69 |
"train_for_seconds": 10000000000,
|
70 |
"save_every_sec": 120,
|
71 |
"keep_checkpoints": 2,
|
|
|
65 |
"summaries_use_frameskip": true,
|
66 |
"heartbeat_interval": 20,
|
67 |
"heartbeat_reporting_interval": 600,
|
68 |
+
"train_for_env_steps": 4000000,
|
69 |
"train_for_seconds": 10000000000,
|
70 |
"save_every_sec": 120,
|
71 |
"keep_checkpoints": 2,
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fae0e012497eea482d79cfa1324e2b488401a505f438be4ef39cc768ea49be6e
|
3 |
+
size 22048753
|
sf_log.txt
CHANGED
@@ -9950,3 +9950,607 @@ main_loop: 23380.8911
|
|
9950 |
[2023-06-21 19:17:03,450][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
9951 |
[2023-06-21 19:17:04,899][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
9952 |
[2023-06-21 19:17:05,230][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9950 |
[2023-06-21 19:17:03,450][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
9951 |
[2023-06-21 19:17:04,899][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
9952 |
[2023-06-21 19:17:05,230][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1198
|
9953 |
+
[2023-06-21 19:17:13,689][62782] The model has been pushed to https://huggingface.co/mihirdeo16/vizdoom_health_gathering_supreme
|
9954 |
+
[2023-06-21 19:17:23,503][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1199
|
9955 |
+
[2023-06-21 19:17:24,937][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1199
|
9956 |
+
[2023-06-21 19:17:25,270][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1199
|
9957 |
+
[2023-06-21 19:17:43,528][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1200
|
9958 |
+
[2023-06-21 19:17:44,988][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1200
|
9959 |
+
[2023-06-21 19:17:45,287][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1200
|
9960 |
+
[2023-06-21 19:18:03,538][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1201
|
9961 |
+
[2023-06-21 19:18:05,035][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1201
|
9962 |
+
[2023-06-21 19:18:05,319][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1201
|
9963 |
+
[2023-06-21 19:18:23,543][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1202
|
9964 |
+
[2023-06-21 19:18:25,067][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1202
|
9965 |
+
[2023-06-21 19:18:25,331][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1202
|
9966 |
+
[2023-06-21 19:18:43,577][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1203
|
9967 |
+
[2023-06-21 19:18:45,091][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1203
|
9968 |
+
[2023-06-21 19:18:45,368][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1203
|
9969 |
+
[2023-06-21 19:19:03,619][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1204
|
9970 |
+
[2023-06-21 19:19:05,106][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1204
|
9971 |
+
[2023-06-21 19:19:05,385][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1204
|
9972 |
+
[2023-06-21 19:19:23,676][78408] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1205
|
9973 |
+
[2023-06-21 19:19:25,133][78405] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1205
|
9974 |
+
[2023-06-21 19:19:25,439][78409] Another process currently holds the lock /var/folders/t0/cgrmhypx1kg2h122jm20kbnm0000gn/T/sf2_md/doom_002.lockfile, attempt: 1205
|
9975 |
+
[2023-06-21 19:19:30,406][78404] VizDoom game.init() threw an exception ViZDoomErrorException('Unexpected ViZDoom instance crash.'). Terminate process...
|
9976 |
+
[2023-06-21 19:19:30,426][78404] EvtLoop [rollout_proc2_evt_loop, process=rollout_proc2] unhandled exception in slot='init' connected to emitter=Emitter(object_id='Sampler', signal_name='_inference_workers_initialized'), args=()
|
9977 |
+
Traceback (most recent call last):
|
9978 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 228, in _game_init
|
9979 |
+
self.game.init()
|
9980 |
+
vizdoom.vizdoom.ViZDoomErrorException: Unexpected ViZDoom instance crash.
|
9981 |
+
|
9982 |
+
During handling of the above exception, another exception occurred:
|
9983 |
+
|
9984 |
+
Traceback (most recent call last):
|
9985 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal
|
9986 |
+
slot_callable(*args)
|
9987 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/rollout_worker.py", line 150, in init
|
9988 |
+
env_runner.init(self.timing)
|
9989 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/non_batched_sampling.py", line 418, in init
|
9990 |
+
self._reset()
|
9991 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/non_batched_sampling.py", line 430, in _reset
|
9992 |
+
observations, info = e.reset(seed=seed) # new way of doing seeding since Gym 0.26.0
|
9993 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 414, in reset
|
9994 |
+
return self.env.reset(seed=seed, options=options)
|
9995 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/utils/make_env.py", line 125, in reset
|
9996 |
+
obs, info = self.env.reset(**kwargs)
|
9997 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/utils/make_env.py", line 110, in reset
|
9998 |
+
obs, info = self.env.reset(**kwargs)
|
9999 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/wrappers/scenario_wrappers/gathering_reward_shaping.py", line 30, in reset
|
10000 |
+
return self.env.reset(**kwargs)
|
10001 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 462, in reset
|
10002 |
+
obs, info = self.env.reset(seed=seed, options=options)
|
10003 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/envs/env_wrappers.py", line 82, in reset
|
10004 |
+
obs, info = self.env.reset(**kwargs)
|
10005 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 414, in reset
|
10006 |
+
return self.env.reset(seed=seed, options=options)
|
10007 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/wrappers/multiplayer_stats.py", line 51, in reset
|
10008 |
+
return self.env.reset(**kwargs)
|
10009 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 323, in reset
|
10010 |
+
self._ensure_initialized()
|
10011 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 274, in _ensure_initialized
|
10012 |
+
self.initialize()
|
10013 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 269, in initialize
|
10014 |
+
self._game_init()
|
10015 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 244, in _game_init
|
10016 |
+
raise EnvCriticalError()
|
10017 |
+
sample_factory.envs.env_utils.EnvCriticalError
|
10018 |
+
[2023-06-21 19:19:30,439][78404] Unhandled exception in evt loop rollout_proc2_evt_loop
|
10019 |
+
[2023-06-21 19:19:31,063][78408] Decorrelating experience for 32 frames...
|
10020 |
+
[2023-06-21 19:19:31,698][78405] Decorrelating experience for 32 frames...
|
10021 |
+
[2023-06-21 19:19:32,297][78409] Decorrelating experience for 64 frames...
|
10022 |
+
[2023-06-21 19:19:32,548][78408] Decorrelating experience for 64 frames...
|
10023 |
+
[2023-06-21 19:19:33,144][78405] Decorrelating experience for 64 frames...
|
10024 |
+
[2023-06-21 19:19:34,607][78409] Decorrelating experience for 96 frames...
|
10025 |
+
[2023-06-21 19:19:34,789][78408] Decorrelating experience for 96 frames...
|
10026 |
+
[2023-06-21 19:19:35,458][78405] Decorrelating experience for 96 frames...
|
10027 |
+
[2023-06-21 19:19:37,212][78409] Stopping RolloutWorker_w6...
|
10028 |
+
[2023-06-21 19:19:37,212][78409] Loop rollout_proc6_evt_loop terminating...
|
10029 |
+
[2023-06-21 19:19:38,966][78405] EvtLoop [rollout_proc3_evt_loop, process=rollout_proc3] unhandled exception in slot='init' connected to emitter=Emitter(object_id='Sampler', signal_name='_inference_workers_initialized'), args=()
|
10030 |
+
Traceback (most recent call last):
|
10031 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal
|
10032 |
+
slot_callable(*args)
|
10033 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/rollout_worker.py", line 150, in init
|
10034 |
+
env_runner.init(self.timing)
|
10035 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/non_batched_sampling.py", line 418, in init
|
10036 |
+
self._reset()
|
10037 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/sampling/non_batched_sampling.py", line 439, in _reset
|
10038 |
+
observations, rew, terminated, truncated, info = e.step(actions)
|
10039 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 408, in step
|
10040 |
+
return self.env.step(action)
|
10041 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/utils/make_env.py", line 129, in step
|
10042 |
+
obs, rew, terminated, truncated, info = self.env.step(action)
|
10043 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/algo/utils/make_env.py", line 115, in step
|
10044 |
+
obs, rew, terminated, truncated, info = self.env.step(action)
|
10045 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/wrappers/scenario_wrappers/gathering_reward_shaping.py", line 33, in step
|
10046 |
+
observation, reward, terminated, truncated, info = self.env.step(action)
|
10047 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 469, in step
|
10048 |
+
observation, reward, terminated, truncated, info = self.env.step(action)
|
10049 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sample_factory/envs/env_wrappers.py", line 86, in step
|
10050 |
+
obs, reward, terminated, truncated, info = self.env.step(action)
|
10051 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/gymnasium/core.py", line 408, in step
|
10052 |
+
return self.env.step(action)
|
10053 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/wrappers/multiplayer_stats.py", line 54, in step
|
10054 |
+
obs, reward, terminated, truncated, info = self.env.step(action)
|
10055 |
+
File "/Users/md/opt/miniconda3/envs/hf/lib/python3.10/site-packages/sf_examples/vizdoom/doom/doom_gym.py", line 452, in step
|
10056 |
+
reward = self.game.make_action(actions_flattened, self.skip_frames)
|
10057 |
+
vizdoom.vizdoom.ViZDoomUnexpectedExitException: Controlled ViZDoom instance exited unexpectedly.
|
10058 |
+
[2023-06-21 19:19:38,971][78405] Unhandled exception Controlled ViZDoom instance exited unexpectedly. in evt loop rollout_proc3_evt_loop
|
10059 |
+
[2023-06-21 20:05:30,124][03300] Saving configuration to /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/config.json...
|
10060 |
+
[2023-06-21 20:05:30,146][03300] Rollout worker 0 uses device cpu
|
10061 |
+
[2023-06-21 20:05:30,147][03300] Rollout worker 1 uses device cpu
|
10062 |
+
[2023-06-21 20:05:30,148][03300] Rollout worker 2 uses device cpu
|
10063 |
+
[2023-06-21 20:05:30,148][03300] Rollout worker 3 uses device cpu
|
10064 |
+
[2023-06-21 20:05:30,148][03300] Rollout worker 4 uses device cpu
|
10065 |
+
[2023-06-21 20:05:30,148][03300] Rollout worker 5 uses device cpu
|
10066 |
+
[2023-06-21 20:05:30,149][03300] Rollout worker 6 uses device cpu
|
10067 |
+
[2023-06-21 20:05:30,149][03300] Rollout worker 7 uses device cpu
|
10068 |
+
[2023-06-21 20:05:30,359][03300] InferenceWorker_p0-w0: min num requests: 2
|
10069 |
+
[2023-06-21 20:05:30,393][03300] Starting all processes...
|
10070 |
+
[2023-06-21 20:05:30,394][03300] Starting process learner_proc0
|
10071 |
+
[2023-06-21 20:05:30,448][03300] Starting all processes...
|
10072 |
+
[2023-06-21 20:05:30,452][03300] Starting process inference_proc0-0
|
10073 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc0
|
10074 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc1
|
10075 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc2
|
10076 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc3
|
10077 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc4
|
10078 |
+
[2023-06-21 20:05:30,452][03300] Starting process rollout_proc5
|
10079 |
+
[2023-06-21 20:05:30,453][03300] Starting process rollout_proc6
|
10080 |
+
[2023-06-21 20:05:30,453][03300] Starting process rollout_proc7
|
10081 |
+
[2023-06-21 20:05:32,460][03737] On MacOS, not setting affinity
|
10082 |
+
[2023-06-21 20:05:32,464][03739] On MacOS, not setting affinity
|
10083 |
+
[2023-06-21 20:05:32,478][03736] Starting seed is not provided
|
10084 |
+
[2023-06-21 20:05:32,478][03736] Initializing actor-critic model on device cpu
|
10085 |
+
[2023-06-21 20:05:32,478][03736] RunningMeanStd input shape: (3, 72, 128)
|
10086 |
+
[2023-06-21 20:05:32,483][03736] RunningMeanStd input shape: (1,)
|
10087 |
+
[2023-06-21 20:05:32,494][03740] On MacOS, not setting affinity
|
10088 |
+
[2023-06-21 20:05:32,494][03742] On MacOS, not setting affinity
|
10089 |
+
[2023-06-21 20:05:32,499][03736] ConvEncoder: input_channels=3
|
10090 |
+
[2023-06-21 20:05:32,560][03743] On MacOS, not setting affinity
|
10091 |
+
[2023-06-21 20:05:32,579][03744] On MacOS, not setting affinity
|
10092 |
+
[2023-06-21 20:05:32,584][03745] On MacOS, not setting affinity
|
10093 |
+
[2023-06-21 20:05:32,591][03741] On MacOS, not setting affinity
|
10094 |
+
[2023-06-21 20:05:32,609][03736] Conv encoder output size: 512
|
10095 |
+
[2023-06-21 20:05:32,609][03736] Policy head output size: 512
|
10096 |
+
[2023-06-21 20:05:32,628][03736] Created Actor Critic model with architecture:
|
10097 |
+
[2023-06-21 20:05:32,629][03736] ActorCriticSharedWeights(
|
10098 |
+
(obs_normalizer): ObservationNormalizer(
|
10099 |
+
(running_mean_std): RunningMeanStdDictInPlace(
|
10100 |
+
(running_mean_std): ModuleDict(
|
10101 |
+
(obs): RunningMeanStdInPlace()
|
10102 |
+
)
|
10103 |
+
)
|
10104 |
+
)
|
10105 |
+
(returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)
|
10106 |
+
(encoder): VizdoomEncoder(
|
10107 |
+
(basic_encoder): ConvEncoder(
|
10108 |
+
(enc): RecursiveScriptModule(
|
10109 |
+
original_name=ConvEncoderImpl
|
10110 |
+
(conv_head): RecursiveScriptModule(
|
10111 |
+
original_name=Sequential
|
10112 |
+
(0): RecursiveScriptModule(original_name=Conv2d)
|
10113 |
+
(1): RecursiveScriptModule(original_name=ELU)
|
10114 |
+
(2): RecursiveScriptModule(original_name=Conv2d)
|
10115 |
+
(3): RecursiveScriptModule(original_name=ELU)
|
10116 |
+
(4): RecursiveScriptModule(original_name=Conv2d)
|
10117 |
+
(5): RecursiveScriptModule(original_name=ELU)
|
10118 |
+
)
|
10119 |
+
(mlp_layers): RecursiveScriptModule(
|
10120 |
+
original_name=Sequential
|
10121 |
+
(0): RecursiveScriptModule(original_name=Linear)
|
10122 |
+
(1): RecursiveScriptModule(original_name=ELU)
|
10123 |
+
)
|
10124 |
+
)
|
10125 |
+
)
|
10126 |
+
)
|
10127 |
+
(core): ModelCoreRNN(
|
10128 |
+
(core): GRU(512, 512)
|
10129 |
+
)
|
10130 |
+
(decoder): MlpDecoder(
|
10131 |
+
(mlp): Identity()
|
10132 |
+
)
|
10133 |
+
(critic_linear): Linear(in_features=512, out_features=1, bias=True)
|
10134 |
+
(action_parameterization): ActionParameterizationDefault(
|
10135 |
+
(distribution_linear): Linear(in_features=512, out_features=5, bias=True)
|
10136 |
+
)
|
10137 |
+
)
|
10138 |
+
[2023-06-21 20:05:32,635][03736] Using optimizer <class 'torch.optim.adam.Adam'>
|
10139 |
+
[2023-06-21 20:05:32,636][03736] Loading state from checkpoint /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001636_6111488.pth...
|
10140 |
+
[2023-06-21 20:05:32,674][03736] Loading model from checkpoint
|
10141 |
+
[2023-06-21 20:05:32,680][03736] Loaded experiment state at self.train_step=1636, self.env_steps=6111488
|
10142 |
+
[2023-06-21 20:05:32,681][03736] Initialized policy 0 weights for model version 1636
|
10143 |
+
[2023-06-21 20:05:32,682][03736] LearnerWorker_p0 finished initialization!
|
10144 |
+
[2023-06-21 20:05:32,685][03738] RunningMeanStd input shape: (3, 72, 128)
|
10145 |
+
[2023-06-21 20:05:32,685][03738] RunningMeanStd input shape: (1,)
|
10146 |
+
[2023-06-21 20:05:32,699][03738] ConvEncoder: input_channels=3
|
10147 |
+
[2023-06-21 20:05:32,751][03738] Conv encoder output size: 512
|
10148 |
+
[2023-06-21 20:05:32,751][03738] Policy head output size: 512
|
10149 |
+
[2023-06-21 20:05:32,760][03300] Inference worker 0-0 is ready!
|
10150 |
+
[2023-06-21 20:05:32,761][03300] All inference workers are ready! Signal rollout workers to start!
|
10151 |
+
[2023-06-21 20:05:32,797][03744] Doom resolution: 160x120, resize resolution: (128, 72)
|
10152 |
+
[2023-06-21 20:05:32,809][03743] Doom resolution: 160x120, resize resolution: (128, 72)
|
10153 |
+
[2023-06-21 20:05:32,809][03740] Doom resolution: 160x120, resize resolution: (128, 72)
|
10154 |
+
[2023-06-21 20:05:32,810][03745] Doom resolution: 160x120, resize resolution: (128, 72)
|
10155 |
+
[2023-06-21 20:05:32,815][03742] Doom resolution: 160x120, resize resolution: (128, 72)
|
10156 |
+
[2023-06-21 20:05:32,816][03741] Doom resolution: 160x120, resize resolution: (128, 72)
|
10157 |
+
[2023-06-21 20:05:32,820][03739] Doom resolution: 160x120, resize resolution: (128, 72)
|
10158 |
+
[2023-06-21 20:05:32,819][03737] Doom resolution: 160x120, resize resolution: (128, 72)
|
10159 |
+
[2023-06-21 20:05:34,186][03741] Decorrelating experience for 0 frames...
|
10160 |
+
[2023-06-21 20:05:34,188][03737] Decorrelating experience for 0 frames...
|
10161 |
+
[2023-06-21 20:05:34,188][03743] Decorrelating experience for 0 frames...
|
10162 |
+
[2023-06-21 20:05:34,192][03740] Decorrelating experience for 0 frames...
|
10163 |
+
[2023-06-21 20:05:34,195][03742] Decorrelating experience for 0 frames...
|
10164 |
+
[2023-06-21 20:05:34,203][03739] Decorrelating experience for 0 frames...
|
10165 |
+
[2023-06-21 20:05:34,307][03300] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 6111488. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)
|
10166 |
+
[2023-06-21 20:05:35,168][03740] Decorrelating experience for 32 frames...
|
10167 |
+
[2023-06-21 20:05:35,177][03741] Decorrelating experience for 32 frames...
|
10168 |
+
[2023-06-21 20:05:35,180][03737] Decorrelating experience for 32 frames...
|
10169 |
+
[2023-06-21 20:05:35,180][03744] Decorrelating experience for 0 frames...
|
10170 |
+
[2023-06-21 20:05:35,183][03743] Decorrelating experience for 32 frames...
|
10171 |
+
[2023-06-21 20:05:35,183][03739] Decorrelating experience for 32 frames...
|
10172 |
+
[2023-06-21 20:05:35,943][03744] Decorrelating experience for 32 frames...
|
10173 |
+
[2023-06-21 20:05:35,945][03742] Decorrelating experience for 32 frames...
|
10174 |
+
[2023-06-21 20:05:36,706][03745] Decorrelating experience for 0 frames...
|
10175 |
+
[2023-06-21 20:05:36,815][03737] Decorrelating experience for 64 frames...
|
10176 |
+
[2023-06-21 20:05:36,815][03740] Decorrelating experience for 64 frames...
|
10177 |
+
[2023-06-21 20:05:36,819][03739] Decorrelating experience for 64 frames...
|
10178 |
+
[2023-06-21 20:05:37,483][03745] Decorrelating experience for 32 frames...
|
10179 |
+
[2023-06-21 20:05:37,486][03741] Decorrelating experience for 64 frames...
|
10180 |
+
[2023-06-21 20:05:37,550][03743] Decorrelating experience for 64 frames...
|
10181 |
+
[2023-06-21 20:05:38,238][03742] Decorrelating experience for 64 frames...
|
10182 |
+
[2023-06-21 20:05:38,241][03744] Decorrelating experience for 64 frames...
|
10183 |
+
[2023-06-21 20:05:39,013][03745] Decorrelating experience for 64 frames...
|
10184 |
+
[2023-06-21 20:05:39,063][03739] Decorrelating experience for 96 frames...
|
10185 |
+
[2023-06-21 20:05:39,137][03737] Decorrelating experience for 96 frames...
|
10186 |
+
[2023-06-21 20:05:39,169][03740] Decorrelating experience for 96 frames...
|
10187 |
+
[2023-06-21 20:05:39,307][03300] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 6111488. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)
|
10188 |
+
[2023-06-21 20:05:39,810][03741] Decorrelating experience for 96 frames...
|
10189 |
+
[2023-06-21 20:05:39,850][03743] Decorrelating experience for 96 frames...
|
10190 |
+
[2023-06-21 20:05:40,542][03742] Decorrelating experience for 96 frames...
|
10191 |
+
[2023-06-21 20:05:40,549][03744] Decorrelating experience for 96 frames...
|
10192 |
+
[2023-06-21 20:05:41,291][03745] Decorrelating experience for 96 frames...
|
10193 |
+
[2023-06-21 20:05:44,306][03300] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 6111488. Throughput: 0: 3.8. Samples: 38. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)
|
10194 |
+
[2023-06-21 20:05:44,308][03300] Avg episode reward: [(0, '0.570')]
|
10195 |
+
[2023-06-21 20:05:47,764][03736] Stopping Batcher_0...
|
10196 |
+
[2023-06-21 20:05:47,764][03736] Saving /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001637_6114688.pth...
|
10197 |
+
[2023-06-21 20:05:47,767][03300] Component Batcher_0 stopped!
|
10198 |
+
[2023-06-21 20:05:47,764][03736] Loop batcher_evt_loop terminating...
|
10199 |
+
[2023-06-21 20:05:47,910][03738] Weights refcount: 2 0
|
10200 |
+
[2023-06-21 20:05:47,912][03738] Stopping InferenceWorker_p0-w0...
|
10201 |
+
[2023-06-21 20:05:47,912][03738] Loop inference_proc0-0_evt_loop terminating...
|
10202 |
+
[2023-06-21 20:05:47,914][03300] Component InferenceWorker_p0-w0 stopped!
|
10203 |
+
[2023-06-21 20:05:47,956][03741] Stopping RolloutWorker_w3...
|
10204 |
+
[2023-06-21 20:05:47,958][03741] Loop rollout_proc3_evt_loop terminating...
|
10205 |
+
[2023-06-21 20:05:47,974][03742] Stopping RolloutWorker_w4...
|
10206 |
+
[2023-06-21 20:05:47,975][03742] Loop rollout_proc4_evt_loop terminating...
|
10207 |
+
[2023-06-21 20:05:47,980][03736] Removing /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001612_6034688.pth
|
10208 |
+
[2023-06-21 20:05:47,985][03737] Stopping RolloutWorker_w0...
|
10209 |
+
[2023-06-21 20:05:47,985][03737] Loop rollout_proc0_evt_loop terminating...
|
10210 |
+
[2023-06-21 20:05:47,989][03745] Stopping RolloutWorker_w7...
|
10211 |
+
[2023-06-21 20:05:47,996][03745] Loop rollout_proc7_evt_loop terminating...
|
10212 |
+
[2023-06-21 20:05:48,006][03743] Stopping RolloutWorker_w5...
|
10213 |
+
[2023-06-21 20:05:48,009][03743] Loop rollout_proc5_evt_loop terminating...
|
10214 |
+
[2023-06-21 20:05:48,016][03736] Saving /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001637_6114688.pth...
|
10215 |
+
[2023-06-21 20:05:48,001][03300] Component RolloutWorker_w3 stopped!
|
10216 |
+
[2023-06-21 20:05:48,016][03740] Stopping RolloutWorker_w2...
|
10217 |
+
[2023-06-21 20:05:48,018][03740] Loop rollout_proc2_evt_loop terminating...
|
10218 |
+
[2023-06-21 20:05:48,018][03744] Stopping RolloutWorker_w6...
|
10219 |
+
[2023-06-21 20:05:48,019][03744] Loop rollout_proc6_evt_loop terminating...
|
10220 |
+
[2023-06-21 20:05:48,017][03300] Component RolloutWorker_w4 stopped!
|
10221 |
+
[2023-06-21 20:05:48,065][03739] Stopping RolloutWorker_w1...
|
10222 |
+
[2023-06-21 20:05:48,065][03739] Loop rollout_proc1_evt_loop terminating...
|
10223 |
+
[2023-06-21 20:05:48,025][03300] Component RolloutWorker_w0 stopped!
|
10224 |
+
[2023-06-21 20:05:48,076][03300] Component RolloutWorker_w7 stopped!
|
10225 |
+
[2023-06-21 20:05:48,078][03300] Component RolloutWorker_w5 stopped!
|
10226 |
+
[2023-06-21 20:05:48,079][03300] Component RolloutWorker_w2 stopped!
|
10227 |
+
[2023-06-21 20:05:48,080][03300] Component RolloutWorker_w6 stopped!
|
10228 |
+
[2023-06-21 20:05:48,080][03300] Component RolloutWorker_w1 stopped!
|
10229 |
+
[2023-06-21 20:05:48,159][03736] Stopping LearnerWorker_p0...
|
10230 |
+
[2023-06-21 20:05:48,159][03736] Loop learner_proc0_evt_loop terminating...
|
10231 |
+
[2023-06-21 20:05:48,159][03300] Component LearnerWorker_p0 stopped!
|
10232 |
+
[2023-06-21 20:05:48,161][03300] Waiting for process learner_proc0 to stop...
|
10233 |
+
[2023-06-21 20:05:48,512][03300] Waiting for process inference_proc0-0 to join...
|
10234 |
+
[2023-06-21 20:05:48,513][03300] Waiting for process rollout_proc0 to join...
|
10235 |
+
[2023-06-21 20:05:48,513][03300] Waiting for process rollout_proc1 to join...
|
10236 |
+
[2023-06-21 20:05:48,514][03300] Waiting for process rollout_proc2 to join...
|
10237 |
+
[2023-06-21 20:05:48,514][03300] Waiting for process rollout_proc3 to join...
|
10238 |
+
[2023-06-21 20:05:48,515][03300] Waiting for process rollout_proc4 to join...
|
10239 |
+
[2023-06-21 20:05:48,515][03300] Waiting for process rollout_proc5 to join...
|
10240 |
+
[2023-06-21 20:05:48,515][03300] Waiting for process rollout_proc6 to join...
|
10241 |
+
[2023-06-21 20:05:48,515][03300] Waiting for process rollout_proc7 to join...
|
10242 |
+
[2023-06-21 20:05:48,516][03300] Batcher 0 profile tree view:
|
10243 |
+
batching: 0.0072, releasing_batches: 0.0000
|
10244 |
+
[2023-06-21 20:05:48,516][03300] InferenceWorker_p0-w0 profile tree view:
|
10245 |
+
wait_policy: 0.0040
|
10246 |
+
wait_policy_total: 13.0879
|
10247 |
+
update_model: 0.0109
|
10248 |
+
weight_update: 0.0029
|
10249 |
+
one_step: 0.0054
|
10250 |
+
handle_policy_step: 1.7860
|
10251 |
+
deserialize: 0.0178, stack: 0.0034, obs_to_device_normalize: 0.1252, forward: 1.5687, send_messages: 0.0158
|
10252 |
+
prepare_outputs: 0.0213
|
10253 |
+
to_cpu: 0.0024
|
10254 |
+
[2023-06-21 20:05:48,516][03300] Learner 0 profile tree view:
|
10255 |
+
misc: 0.0000, prepare_batch: 0.3879
|
10256 |
+
train: 1.2408
|
10257 |
+
epoch_init: 0.0000, minibatch_init: 0.0000, losses_postprocess: 0.0003, kl_divergence: 0.0007, after_optimizer: 0.0031
|
10258 |
+
calculate_losses: 0.7032
|
10259 |
+
losses_init: 0.0000, forward_head: 0.6612, bptt_initial: 0.0082, tail: 0.0032, advantages_returns: 0.0018, losses: 0.0048
|
10260 |
+
bptt: 0.0231
|
10261 |
+
bptt_forward_core: 0.0229
|
10262 |
+
update: 0.5322
|
10263 |
+
clip: 0.0019
|
10264 |
+
[2023-06-21 20:05:48,517][03300] RolloutWorker_w0 profile tree view:
|
10265 |
+
wait_for_trajectories: 0.0006, enqueue_policy_requests: 0.0150, env_step: 6.1927, overhead: 0.0136, complete_rollouts: 0.0002
|
10266 |
+
save_policy_outputs: 0.0078
|
10267 |
+
split_output_tensors: 0.0041
|
10268 |
+
[2023-06-21 20:05:48,517][03300] RolloutWorker_w7 profile tree view:
|
10269 |
+
wait_for_trajectories: 0.0003, enqueue_policy_requests: 0.0084, env_step: 4.0969, overhead: 0.0086, complete_rollouts: 0.0002
|
10270 |
+
save_policy_outputs: 0.0043
|
10271 |
+
split_output_tensors: 0.0022
|
10272 |
+
[2023-06-21 20:05:48,518][03300] Loop Runner_EvtLoop terminating...
|
10273 |
+
[2023-06-21 20:05:48,518][03300] Runner profile tree view:
|
10274 |
+
main_loop: 18.1250
|
10275 |
+
[2023-06-21 20:05:48,518][03300] Collected {0: 6114688}, FPS: 176.6
|
10276 |
+
[2023-06-21 20:07:06,012][03300] Loading existing experiment configuration from /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/config.json
|
10277 |
+
[2023-06-21 20:07:06,013][03300] Overriding arg 'num_workers' with value 1 passed from command line
|
10278 |
+
[2023-06-21 20:07:06,014][03300] Adding new argument 'no_render'=True that is not in the saved config file!
|
10279 |
+
[2023-06-21 20:07:06,014][03300] Adding new argument 'save_video'=True that is not in the saved config file!
|
10280 |
+
[2023-06-21 20:07:06,014][03300] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!
|
10281 |
+
[2023-06-21 20:07:06,015][03300] Adding new argument 'video_name'=None that is not in the saved config file!
|
10282 |
+
[2023-06-21 20:07:06,015][03300] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file!
|
10283 |
+
[2023-06-21 20:07:06,015][03300] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!
|
10284 |
+
[2023-06-21 20:07:06,016][03300] Adding new argument 'push_to_hub'=False that is not in the saved config file!
|
10285 |
+
[2023-06-21 20:07:06,016][03300] Adding new argument 'hf_repository'=None that is not in the saved config file!
|
10286 |
+
[2023-06-21 20:07:06,017][03300] Adding new argument 'policy_index'=0 that is not in the saved config file!
|
10287 |
+
[2023-06-21 20:07:06,017][03300] Adding new argument 'eval_deterministic'=False that is not in the saved config file!
|
10288 |
+
[2023-06-21 20:07:06,017][03300] Adding new argument 'train_script'=None that is not in the saved config file!
|
10289 |
+
[2023-06-21 20:07:06,017][03300] Adding new argument 'enjoy_script'=None that is not in the saved config file!
|
10290 |
+
[2023-06-21 20:07:06,018][03300] Using frameskip 1 and render_action_repeat=4 for evaluation
|
10291 |
+
[2023-06-21 20:07:06,023][03300] Doom resolution: 160x120, resize resolution: (128, 72)
|
10292 |
+
[2023-06-21 20:07:06,023][03300] RunningMeanStd input shape: (3, 72, 128)
|
10293 |
+
[2023-06-21 20:07:06,024][03300] RunningMeanStd input shape: (1,)
|
10294 |
+
[2023-06-21 20:07:06,034][03300] ConvEncoder: input_channels=3
|
10295 |
+
[2023-06-21 20:07:06,086][03300] Conv encoder output size: 512
|
10296 |
+
[2023-06-21 20:07:06,086][03300] Policy head output size: 512
|
10297 |
+
[2023-06-21 20:07:06,092][03300] Loading state from checkpoint /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001637_6114688.pth...
|
10298 |
+
[2023-06-21 20:07:07,663][03300] Num frames 100...
|
10299 |
+
[2023-06-21 20:07:08,511][03300] Num frames 200...
|
10300 |
+
[2023-06-21 20:07:09,351][03300] Num frames 300...
|
10301 |
+
[2023-06-21 20:07:10,204][03300] Num frames 400...
|
10302 |
+
[2023-06-21 20:07:10,878][03300] Avg episode rewards: #0: 8.680, true rewards: #0: 4.680
|
10303 |
+
[2023-06-21 20:07:10,881][03300] Avg episode reward: 8.680, avg true_objective: 4.680
|
10304 |
+
[2023-06-21 20:07:11,150][03300] Num frames 500...
|
10305 |
+
[2023-06-21 20:07:12,013][03300] Num frames 600...
|
10306 |
+
[2023-06-21 20:07:12,877][03300] Num frames 700...
|
10307 |
+
[2023-06-21 20:07:13,741][03300] Num frames 800...
|
10308 |
+
[2023-06-21 20:07:14,605][03300] Num frames 900...
|
10309 |
+
[2023-06-21 20:07:15,463][03300] Num frames 1000...
|
10310 |
+
[2023-06-21 20:07:16,336][03300] Num frames 1100...
|
10311 |
+
[2023-06-21 20:07:17,178][03300] Num frames 1200...
|
10312 |
+
[2023-06-21 20:07:18,030][03300] Num frames 1300...
|
10313 |
+
[2023-06-21 20:07:18,911][03300] Num frames 1400...
|
10314 |
+
[2023-06-21 20:07:19,783][03300] Num frames 1500...
|
10315 |
+
[2023-06-21 20:07:20,668][03300] Num frames 1600...
|
10316 |
+
[2023-06-21 20:07:21,522][03300] Num frames 1700...
|
10317 |
+
[2023-06-21 20:07:22,368][03300] Num frames 1800...
|
10318 |
+
[2023-06-21 20:07:23,205][03300] Num frames 1900...
|
10319 |
+
[2023-06-21 20:07:24,079][03300] Num frames 2000...
|
10320 |
+
[2023-06-21 20:07:24,201][03300] Avg episode rewards: #0: 23.020, true rewards: #0: 10.020
|
10321 |
+
[2023-06-21 20:07:24,203][03300] Avg episode reward: 23.020, avg true_objective: 10.020
|
10322 |
+
[2023-06-21 20:07:25,021][03300] Num frames 2100...
|
10323 |
+
[2023-06-21 20:07:25,888][03300] Num frames 2200...
|
10324 |
+
[2023-06-21 20:07:26,726][03300] Num frames 2300...
|
10325 |
+
[2023-06-21 20:07:27,611][03300] Num frames 2400...
|
10326 |
+
[2023-06-21 20:07:28,457][03300] Num frames 2500...
|
10327 |
+
[2023-06-21 20:07:29,319][03300] Num frames 2600...
|
10328 |
+
[2023-06-21 20:07:30,194][03300] Num frames 2700...
|
10329 |
+
[2023-06-21 20:07:30,359][03300] Avg episode rewards: #0: 19.360, true rewards: #0: 9.027
|
10330 |
+
[2023-06-21 20:07:30,362][03300] Avg episode reward: 19.360, avg true_objective: 9.027
|
10331 |
+
[2023-06-21 20:07:31,142][03300] Num frames 2800...
|
10332 |
+
[2023-06-21 20:07:31,994][03300] Num frames 2900...
|
10333 |
+
[2023-06-21 20:07:32,874][03300] Num frames 3000...
|
10334 |
+
[2023-06-21 20:07:33,716][03300] Num frames 3100...
|
10335 |
+
[2023-06-21 20:07:34,575][03300] Num frames 3200...
|
10336 |
+
[2023-06-21 20:07:35,442][03300] Num frames 3300...
|
10337 |
+
[2023-06-21 20:07:36,286][03300] Num frames 3400...
|
10338 |
+
[2023-06-21 20:07:37,156][03300] Num frames 3500...
|
10339 |
+
[2023-06-21 20:07:37,893][03300] Avg episode rewards: #0: 18.180, true rewards: #0: 8.930
|
10340 |
+
[2023-06-21 20:07:37,896][03300] Avg episode reward: 18.180, avg true_objective: 8.930
|
10341 |
+
[2023-06-21 20:07:38,148][03300] Num frames 3600...
|
10342 |
+
[2023-06-21 20:07:39,035][03300] Num frames 3700...
|
10343 |
+
[2023-06-21 20:07:39,919][03300] Num frames 3800...
|
10344 |
+
[2023-06-21 20:07:40,790][03300] Num frames 3900...
|
10345 |
+
[2023-06-21 20:07:41,643][03300] Num frames 4000...
|
10346 |
+
[2023-06-21 20:07:42,508][03300] Num frames 4100...
|
10347 |
+
[2023-06-21 20:07:43,327][03300] Num frames 4200...
|
10348 |
+
[2023-06-21 20:07:44,046][03300] Num frames 4300...
|
10349 |
+
[2023-06-21 20:07:44,708][03300] Avg episode rewards: #0: 17.944, true rewards: #0: 8.744
|
10350 |
+
[2023-06-21 20:07:44,710][03300] Avg episode reward: 17.944, avg true_objective: 8.744
|
10351 |
+
[2023-06-21 20:07:44,942][03300] Num frames 4400...
|
10352 |
+
[2023-06-21 20:07:45,796][03300] Num frames 4500...
|
10353 |
+
[2023-06-21 20:07:46,646][03300] Num frames 4600...
|
10354 |
+
[2023-06-21 20:07:47,504][03300] Num frames 4700...
|
10355 |
+
[2023-06-21 20:07:48,368][03300] Num frames 4800...
|
10356 |
+
[2023-06-21 20:07:49,240][03300] Num frames 4900...
|
10357 |
+
[2023-06-21 20:07:50,103][03300] Num frames 5000...
|
10358 |
+
[2023-06-21 20:07:50,990][03300] Num frames 5100...
|
10359 |
+
[2023-06-21 20:07:51,873][03300] Num frames 5200...
|
10360 |
+
[2023-06-21 20:07:52,702][03300] Num frames 5300...
|
10361 |
+
[2023-06-21 20:07:53,523][03300] Num frames 5400...
|
10362 |
+
[2023-06-21 20:07:54,380][03300] Num frames 5500...
|
10363 |
+
[2023-06-21 20:07:55,259][03300] Num frames 5600...
|
10364 |
+
[2023-06-21 20:07:56,102][03300] Num frames 5700...
|
10365 |
+
[2023-06-21 20:07:56,972][03300] Num frames 5800...
|
10366 |
+
[2023-06-21 20:07:57,826][03300] Num frames 5900...
|
10367 |
+
[2023-06-21 20:07:58,679][03300] Num frames 6000...
|
10368 |
+
[2023-06-21 20:07:59,568][03300] Num frames 6100...
|
10369 |
+
[2023-06-21 20:08:00,466][03300] Num frames 6200...
|
10370 |
+
[2023-06-21 20:08:01,328][03300] Num frames 6300...
|
10371 |
+
[2023-06-21 20:08:02,202][03300] Num frames 6400...
|
10372 |
+
[2023-06-21 20:08:02,552][03300] Avg episode rewards: #0: 24.715, true rewards: #0: 10.715
|
10373 |
+
[2023-06-21 20:08:02,554][03300] Avg episode reward: 24.715, avg true_objective: 10.715
|
10374 |
+
[2023-06-21 20:08:03,175][03300] Num frames 6500...
|
10375 |
+
[2023-06-21 20:08:04,026][03300] Num frames 6600...
|
10376 |
+
[2023-06-21 20:08:04,901][03300] Num frames 6700...
|
10377 |
+
[2023-06-21 20:08:05,783][03300] Num frames 6800...
|
10378 |
+
[2023-06-21 20:08:06,639][03300] Num frames 6900...
|
10379 |
+
[2023-06-21 20:08:07,523][03300] Num frames 7000...
|
10380 |
+
[2023-06-21 20:08:08,398][03300] Num frames 7100...
|
10381 |
+
[2023-06-21 20:08:09,287][03300] Num frames 7200...
|
10382 |
+
[2023-06-21 20:08:10,069][03300] Avg episode rewards: #0: 23.967, true rewards: #0: 10.396
|
10383 |
+
[2023-06-21 20:08:10,072][03300] Avg episode reward: 23.967, avg true_objective: 10.396
|
10384 |
+
[2023-06-21 20:08:10,268][03300] Num frames 7300...
|
10385 |
+
[2023-06-21 20:08:11,157][03300] Num frames 7400...
|
10386 |
+
[2023-06-21 20:08:12,034][03300] Num frames 7500...
|
10387 |
+
[2023-06-21 20:08:12,871][03300] Num frames 7600...
|
10388 |
+
[2023-06-21 20:08:13,723][03300] Num frames 7700...
|
10389 |
+
[2023-06-21 20:08:14,579][03300] Num frames 7800...
|
10390 |
+
[2023-06-21 20:08:15,440][03300] Num frames 7900...
|
10391 |
+
[2023-06-21 20:08:16,319][03300] Num frames 8000...
|
10392 |
+
[2023-06-21 20:08:17,093][03300] Avg episode rewards: #0: 23.096, true rewards: #0: 10.096
|
10393 |
+
[2023-06-21 20:08:17,096][03300] Avg episode reward: 23.096, avg true_objective: 10.096
|
10394 |
+
[2023-06-21 20:08:17,283][03300] Num frames 8100...
|
10395 |
+
[2023-06-21 20:08:18,140][03300] Num frames 8200...
|
10396 |
+
[2023-06-21 20:08:18,980][03300] Num frames 8300...
|
10397 |
+
[2023-06-21 20:08:19,820][03300] Num frames 8400...
|
10398 |
+
[2023-06-21 20:08:20,672][03300] Num frames 8500...
|
10399 |
+
[2023-06-21 20:08:21,544][03300] Num frames 8600...
|
10400 |
+
[2023-06-21 20:08:21,820][03300] Avg episode rewards: #0: 21.468, true rewards: #0: 9.579
|
10401 |
+
[2023-06-21 20:08:21,823][03300] Avg episode reward: 21.468, avg true_objective: 9.579
|
10402 |
+
[2023-06-21 20:08:22,518][03300] Num frames 8700...
|
10403 |
+
[2023-06-21 20:08:23,385][03300] Num frames 8800...
|
10404 |
+
[2023-06-21 20:08:24,248][03300] Num frames 8900...
|
10405 |
+
[2023-06-21 20:08:24,651][03300] Avg episode rewards: #0: 19.835, true rewards: #0: 8.935
|
10406 |
+
[2023-06-21 20:08:24,654][03300] Avg episode reward: 19.835, avg true_objective: 8.935
|
10407 |
+
[2023-06-21 20:08:37,583][03300] Replay video saved to /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/replay.mp4!
|
10408 |
+
[2023-06-21 20:08:48,389][03300] Loading existing experiment configuration from /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/config.json
|
10409 |
+
[2023-06-21 20:08:48,390][03300] Overriding arg 'num_workers' with value 1 passed from command line
|
10410 |
+
[2023-06-21 20:08:48,391][03300] Adding new argument 'no_render'=True that is not in the saved config file!
|
10411 |
+
[2023-06-21 20:08:48,391][03300] Adding new argument 'save_video'=True that is not in the saved config file!
|
10412 |
+
[2023-06-21 20:08:48,391][03300] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!
|
10413 |
+
[2023-06-21 20:08:48,392][03300] Adding new argument 'video_name'=None that is not in the saved config file!
|
10414 |
+
[2023-06-21 20:08:48,392][03300] Adding new argument 'max_num_frames'=100000 that is not in the saved config file!
|
10415 |
+
[2023-06-21 20:08:48,393][03300] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!
|
10416 |
+
[2023-06-21 20:08:48,394][03300] Adding new argument 'push_to_hub'=True that is not in the saved config file!
|
10417 |
+
[2023-06-21 20:08:48,394][03300] Adding new argument 'hf_repository'='mihirdeo16/vizdoom_health_gathering_supreme' that is not in the saved config file!
|
10418 |
+
[2023-06-21 20:08:48,395][03300] Adding new argument 'policy_index'=0 that is not in the saved config file!
|
10419 |
+
[2023-06-21 20:08:48,395][03300] Adding new argument 'eval_deterministic'=False that is not in the saved config file!
|
10420 |
+
[2023-06-21 20:08:48,396][03300] Adding new argument 'train_script'=None that is not in the saved config file!
|
10421 |
+
[2023-06-21 20:08:48,396][03300] Adding new argument 'enjoy_script'=None that is not in the saved config file!
|
10422 |
+
[2023-06-21 20:08:48,396][03300] Using frameskip 1 and render_action_repeat=4 for evaluation
|
10423 |
+
[2023-06-21 20:08:48,402][03300] RunningMeanStd input shape: (3, 72, 128)
|
10424 |
+
[2023-06-21 20:08:48,403][03300] RunningMeanStd input shape: (1,)
|
10425 |
+
[2023-06-21 20:08:48,410][03300] ConvEncoder: input_channels=3
|
10426 |
+
[2023-06-21 20:08:48,425][03300] Conv encoder output size: 512
|
10427 |
+
[2023-06-21 20:08:48,425][03300] Policy head output size: 512
|
10428 |
+
[2023-06-21 20:08:48,431][03300] Loading state from checkpoint /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/checkpoint_p0/checkpoint_000001637_6114688.pth...
|
10429 |
+
[2023-06-21 20:08:50,025][03300] Num frames 100...
|
10430 |
+
[2023-06-21 20:08:50,876][03300] Num frames 200...
|
10431 |
+
[2023-06-21 20:08:51,777][03300] Num frames 300...
|
10432 |
+
[2023-06-21 20:08:52,671][03300] Num frames 400...
|
10433 |
+
[2023-06-21 20:08:53,543][03300] Num frames 500...
|
10434 |
+
[2023-06-21 20:08:54,430][03300] Num frames 600...
|
10435 |
+
[2023-06-21 20:08:55,320][03300] Num frames 700...
|
10436 |
+
[2023-06-21 20:08:56,026][03300] Avg episode rewards: #0: 15.680, true rewards: #0: 7.680
|
10437 |
+
[2023-06-21 20:08:56,028][03300] Avg episode reward: 15.680, avg true_objective: 7.680
|
10438 |
+
[2023-06-21 20:08:56,308][03300] Num frames 800...
|
10439 |
+
[2023-06-21 20:08:57,182][03300] Num frames 900...
|
10440 |
+
[2023-06-21 20:08:58,074][03300] Num frames 1000...
|
10441 |
+
[2023-06-21 20:08:58,962][03300] Num frames 1100...
|
10442 |
+
[2023-06-21 20:08:59,853][03300] Num frames 1200...
|
10443 |
+
[2023-06-21 20:09:00,780][03300] Num frames 1300...
|
10444 |
+
[2023-06-21 20:09:01,662][03300] Num frames 1400...
|
10445 |
+
[2023-06-21 20:09:02,547][03300] Num frames 1500...
|
10446 |
+
[2023-06-21 20:09:03,396][03300] Avg episode rewards: #0: 17.430, true rewards: #0: 7.930
|
10447 |
+
[2023-06-21 20:09:03,399][03300] Avg episode reward: 17.430, avg true_objective: 7.930
|
10448 |
+
[2023-06-21 20:09:03,516][03300] Num frames 1600...
|
10449 |
+
[2023-06-21 20:09:04,394][03300] Num frames 1700...
|
10450 |
+
[2023-06-21 20:09:05,309][03300] Num frames 1800...
|
10451 |
+
[2023-06-21 20:09:06,167][03300] Num frames 1900...
|
10452 |
+
[2023-06-21 20:09:07,043][03300] Num frames 2000...
|
10453 |
+
[2023-06-21 20:09:07,961][03300] Num frames 2100...
|
10454 |
+
[2023-06-21 20:09:08,610][03300] Avg episode rewards: #0: 14.873, true rewards: #0: 7.207
|
10455 |
+
[2023-06-21 20:09:08,612][03300] Avg episode reward: 14.873, avg true_objective: 7.207
|
10456 |
+
[2023-06-21 20:09:08,949][03300] Num frames 2200...
|
10457 |
+
[2023-06-21 20:09:09,827][03300] Num frames 2300...
|
10458 |
+
[2023-06-21 20:09:10,698][03300] Num frames 2400...
|
10459 |
+
[2023-06-21 20:09:11,591][03300] Num frames 2500...
|
10460 |
+
[2023-06-21 20:09:12,482][03300] Num frames 2600...
|
10461 |
+
[2023-06-21 20:09:13,425][03300] Num frames 2700...
|
10462 |
+
[2023-06-21 20:09:14,327][03300] Num frames 2800...
|
10463 |
+
[2023-06-21 20:09:15,210][03300] Num frames 2900...
|
10464 |
+
[2023-06-21 20:09:16,100][03300] Num frames 3000...
|
10465 |
+
[2023-06-21 20:09:16,989][03300] Num frames 3100...
|
10466 |
+
[2023-06-21 20:09:17,855][03300] Num frames 3200...
|
10467 |
+
[2023-06-21 20:09:18,714][03300] Num frames 3300...
|
10468 |
+
[2023-06-21 20:09:19,612][03300] Num frames 3400...
|
10469 |
+
[2023-06-21 20:09:20,489][03300] Num frames 3500...
|
10470 |
+
[2023-06-21 20:09:21,398][03300] Num frames 3600...
|
10471 |
+
[2023-06-21 20:09:22,288][03300] Num frames 3700...
|
10472 |
+
[2023-06-21 20:09:23,143][03300] Num frames 3800...
|
10473 |
+
[2023-06-21 20:09:24,033][03300] Num frames 3900...
|
10474 |
+
[2023-06-21 20:09:24,648][03300] Avg episode rewards: #0: 22.897, true rewards: #0: 9.897
|
10475 |
+
[2023-06-21 20:09:24,651][03300] Avg episode reward: 22.897, avg true_objective: 9.897
|
10476 |
+
[2023-06-21 20:09:25,017][03300] Num frames 4000...
|
10477 |
+
[2023-06-21 20:09:25,887][03300] Num frames 4100...
|
10478 |
+
[2023-06-21 20:09:26,806][03300] Num frames 4200...
|
10479 |
+
[2023-06-21 20:09:27,693][03300] Num frames 4300...
|
10480 |
+
[2023-06-21 20:09:28,556][03300] Num frames 4400...
|
10481 |
+
[2023-06-21 20:09:29,456][03300] Num frames 4500...
|
10482 |
+
[2023-06-21 20:09:30,389][03300] Num frames 4600...
|
10483 |
+
[2023-06-21 20:09:31,287][03300] Num frames 4700...
|
10484 |
+
[2023-06-21 20:09:32,165][03300] Num frames 4800...
|
10485 |
+
[2023-06-21 20:09:33,049][03300] Num frames 4900...
|
10486 |
+
[2023-06-21 20:09:33,922][03300] Num frames 5000...
|
10487 |
+
[2023-06-21 20:09:34,709][03300] Avg episode rewards: #0: 22.758, true rewards: #0: 10.158
|
10488 |
+
[2023-06-21 20:09:34,712][03300] Avg episode reward: 22.758, avg true_objective: 10.158
|
10489 |
+
[2023-06-21 20:09:34,890][03300] Num frames 5100...
|
10490 |
+
[2023-06-21 20:09:35,771][03300] Num frames 5200...
|
10491 |
+
[2023-06-21 20:09:36,673][03300] Num frames 5300...
|
10492 |
+
[2023-06-21 20:09:37,552][03300] Num frames 5400...
|
10493 |
+
[2023-06-21 20:09:38,434][03300] Num frames 5500...
|
10494 |
+
[2023-06-21 20:09:39,311][03300] Num frames 5600...
|
10495 |
+
[2023-06-21 20:09:40,213][03300] Num frames 5700...
|
10496 |
+
[2023-06-21 20:09:41,098][03300] Num frames 5800...
|
10497 |
+
[2023-06-21 20:09:41,978][03300] Num frames 5900...
|
10498 |
+
[2023-06-21 20:09:42,893][03300] Num frames 6000...
|
10499 |
+
[2023-06-21 20:09:43,720][03300] Num frames 6100...
|
10500 |
+
[2023-06-21 20:09:44,422][03300] Num frames 6200...
|
10501 |
+
[2023-06-21 20:09:45,214][03300] Num frames 6300...
|
10502 |
+
[2023-06-21 20:09:46,139][03300] Num frames 6400...
|
10503 |
+
[2023-06-21 20:09:46,992][03300] Num frames 6500...
|
10504 |
+
[2023-06-21 20:09:47,677][03300] Avg episode rewards: #0: 25.777, true rewards: #0: 10.943
|
10505 |
+
[2023-06-21 20:09:47,679][03300] Avg episode reward: 25.777, avg true_objective: 10.943
|
10506 |
+
[2023-06-21 20:09:47,982][03300] Num frames 6600...
|
10507 |
+
[2023-06-21 20:09:48,892][03300] Num frames 6700...
|
10508 |
+
[2023-06-21 20:09:49,800][03300] Num frames 6800...
|
10509 |
+
[2023-06-21 20:09:50,701][03300] Num frames 6900...
|
10510 |
+
[2023-06-21 20:09:51,572][03300] Num frames 7000...
|
10511 |
+
[2023-06-21 20:09:52,408][03300] Num frames 7100...
|
10512 |
+
[2023-06-21 20:09:53,196][03300] Num frames 7200...
|
10513 |
+
[2023-06-21 20:09:53,984][03300] Num frames 7300...
|
10514 |
+
[2023-06-21 20:09:54,880][03300] Num frames 7400...
|
10515 |
+
[2023-06-21 20:09:55,782][03300] Num frames 7500...
|
10516 |
+
[2023-06-21 20:09:56,675][03300] Num frames 7600...
|
10517 |
+
[2023-06-21 20:09:57,545][03300] Num frames 7700...
|
10518 |
+
[2023-06-21 20:09:58,416][03300] Num frames 7800...
|
10519 |
+
[2023-06-21 20:09:59,321][03300] Num frames 7900...
|
10520 |
+
[2023-06-21 20:10:00,190][03300] Num frames 8000...
|
10521 |
+
[2023-06-21 20:10:01,075][03300] Num frames 8100...
|
10522 |
+
[2023-06-21 20:10:01,964][03300] Num frames 8200...
|
10523 |
+
[2023-06-21 20:10:02,616][03300] Avg episode rewards: #0: 27.517, true rewards: #0: 11.803
|
10524 |
+
[2023-06-21 20:10:02,619][03300] Avg episode reward: 27.517, avg true_objective: 11.803
|
10525 |
+
[2023-06-21 20:10:02,949][03300] Num frames 8300...
|
10526 |
+
[2023-06-21 20:10:03,830][03300] Num frames 8400...
|
10527 |
+
[2023-06-21 20:10:04,681][03300] Num frames 8500...
|
10528 |
+
[2023-06-21 20:10:05,555][03300] Num frames 8600...
|
10529 |
+
[2023-06-21 20:10:06,435][03300] Num frames 8700...
|
10530 |
+
[2023-06-21 20:10:07,302][03300] Num frames 8800...
|
10531 |
+
[2023-06-21 20:10:08,156][03300] Num frames 8900...
|
10532 |
+
[2023-06-21 20:10:09,030][03300] Num frames 9000...
|
10533 |
+
[2023-06-21 20:10:09,896][03300] Num frames 9100...
|
10534 |
+
[2023-06-21 20:10:10,752][03300] Num frames 9200...
|
10535 |
+
[2023-06-21 20:10:11,621][03300] Num frames 9300...
|
10536 |
+
[2023-06-21 20:10:12,495][03300] Num frames 9400...
|
10537 |
+
[2023-06-21 20:10:13,355][03300] Num frames 9500...
|
10538 |
+
[2023-06-21 20:10:14,201][03300] Num frames 9600...
|
10539 |
+
[2023-06-21 20:10:14,883][03300] Avg episode rewards: #0: 28.331, true rewards: #0: 12.081
|
10540 |
+
[2023-06-21 20:10:14,885][03300] Avg episode reward: 28.331, avg true_objective: 12.081
|
10541 |
+
[2023-06-21 20:10:15,193][03300] Num frames 9700...
|
10542 |
+
[2023-06-21 20:10:16,066][03300] Num frames 9800...
|
10543 |
+
[2023-06-21 20:10:16,924][03300] Num frames 9900...
|
10544 |
+
[2023-06-21 20:10:17,800][03300] Avg episode rewards: #0: 25.878, true rewards: #0: 11.100
|
10545 |
+
[2023-06-21 20:10:17,803][03300] Avg episode reward: 25.878, avg true_objective: 11.100
|
10546 |
+
[2023-06-21 20:10:17,887][03300] Num frames 10000...
|
10547 |
+
[2023-06-21 20:10:18,743][03300] Num frames 10100...
|
10548 |
+
[2023-06-21 20:10:19,626][03300] Num frames 10200...
|
10549 |
+
[2023-06-21 20:10:20,496][03300] Num frames 10300...
|
10550 |
+
[2023-06-21 20:10:21,379][03300] Num frames 10400...
|
10551 |
+
[2023-06-21 20:10:22,247][03300] Num frames 10500...
|
10552 |
+
[2023-06-21 20:10:23,101][03300] Num frames 10600...
|
10553 |
+
[2023-06-21 20:10:23,993][03300] Num frames 10700...
|
10554 |
+
[2023-06-21 20:10:24,325][03300] Avg episode rewards: #0: 24.626, true rewards: #0: 10.726
|
10555 |
+
[2023-06-21 20:10:24,328][03300] Avg episode reward: 24.626, avg true_objective: 10.726
|
10556 |
+
[2023-06-21 20:10:38,574][03300] Replay video saved to /Users/md/Code/python/jubilant-memory/RL/train_dir/default_experiment/replay.mp4!
|