Initial commit
Browse files- README.md +2 -2
- args.yml +2 -2
- config.yml +1 -1
- dqn-SpaceInvadersNoFrameskip-v4.zip +2 -2
- dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version +1 -1
- dqn-SpaceInvadersNoFrameskip-v4/data +0 -0
- dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth +2 -2
- dqn-SpaceInvadersNoFrameskip-v4/policy.pth +1 -1
- dqn-SpaceInvadersNoFrameskip-v4/system_info.txt +7 -7
- replay.mp4 +2 -2
- results.json +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: SpaceInvadersNoFrameskip-v4
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
|
|
72 |
('gradient_steps', 1),
|
73 |
('learning_rate', 0.0001),
|
74 |
('learning_starts', 100000),
|
75 |
-
('n_timesteps',
|
76 |
('optimize_memory_usage', False),
|
77 |
('policy', 'CnnPolicy'),
|
78 |
('target_update_interval', 1000),
|
|
|
16 |
type: SpaceInvadersNoFrameskip-v4
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 1124.00 +/- 189.17
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
72 |
('gradient_steps', 1),
|
73 |
('learning_rate', 0.0001),
|
74 |
('learning_starts', 100000),
|
75 |
+
('n_timesteps', 10000000.0),
|
76 |
('optimize_memory_usage', False),
|
77 |
('policy', 'CnnPolicy'),
|
78 |
('target_update_interval', 1000),
|
args.yml
CHANGED
@@ -20,7 +20,7 @@
|
|
20 |
- - hyperparams
|
21 |
- null
|
22 |
- - log_folder
|
23 |
-
- logs
|
24 |
- - log_interval
|
25 |
- -1
|
26 |
- - max_total_trials
|
@@ -56,7 +56,7 @@
|
|
56 |
- - save_replay_buffer
|
57 |
- false
|
58 |
- - seed
|
59 |
-
-
|
60 |
- - storage
|
61 |
- null
|
62 |
- - study_name
|
|
|
20 |
- - hyperparams
|
21 |
- null
|
22 |
- - log_folder
|
23 |
+
- /home/luyang/logs
|
24 |
- - log_interval
|
25 |
- -1
|
26 |
- - max_total_trials
|
|
|
56 |
- - save_replay_buffer
|
57 |
- false
|
58 |
- - seed
|
59 |
+
- 334622670
|
60 |
- - storage
|
61 |
- null
|
62 |
- - study_name
|
config.yml
CHANGED
@@ -18,7 +18,7 @@
|
|
18 |
- - learning_starts
|
19 |
- 100000
|
20 |
- - n_timesteps
|
21 |
-
-
|
22 |
- - optimize_memory_usage
|
23 |
- false
|
24 |
- - policy
|
|
|
18 |
- - learning_starts
|
19 |
- 100000
|
20 |
- - n_timesteps
|
21 |
+
- 10000000.0
|
22 |
- - optimize_memory_usage
|
23 |
- false
|
24 |
- - policy
|
dqn-SpaceInvadersNoFrameskip-v4.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f31e8b4af033c662bd94dccdf6c8e60eaca2e858e242163e28776096a334e90
|
3 |
+
size 27221776
|
dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version
CHANGED
@@ -1 +1 @@
|
|
1 |
-
2.
|
|
|
1 |
+
2.3.2
|
dqn-SpaceInvadersNoFrameskip-v4/data
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de4c2926f26728409481b19f1ede6562098191066e83d9400d3bbfb729fd58af
|
3 |
+
size 13506236
|
dqn-SpaceInvadersNoFrameskip-v4/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13505370
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a772f6f7543493ef07ad1d044ac45f2ebe29601fd84416c907c7694efd56dd1b
|
3 |
size 13505370
|
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
-
- OS: Linux-6.
|
2 |
-
- Python: 3.
|
3 |
-
- Stable-Baselines3: 2.
|
4 |
-
- PyTorch: 2.4.
|
5 |
- GPU Enabled: True
|
6 |
-
- Numpy: 1.
|
7 |
-
- Cloudpickle:
|
8 |
- Gymnasium: 0.29.1
|
9 |
-
- OpenAI Gym: 0.
|
|
|
1 |
+
- OS: Linux-6.8.0-41-generic-x86_64-with-glibc2.39 # 41-Ubuntu SMP PREEMPT_DYNAMIC Fri Aug 2 20:41:06 UTC 2024
|
2 |
+
- Python: 3.11.9
|
3 |
+
- Stable-Baselines3: 2.3.2
|
4 |
+
- PyTorch: 2.4.1+cu121
|
5 |
- GPU Enabled: True
|
6 |
+
- Numpy: 2.1.1
|
7 |
+
- Cloudpickle: 3.0.0
|
8 |
- Gymnasium: 0.29.1
|
9 |
+
- OpenAI Gym: 0.26.2
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d4773ccf89b75620f30d80693532997bdb93df145e260e4f20e9deb830cbe9
|
3 |
+
size 213961
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 1124.0, "std_reward": 189.16659324521336, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-09-16T02:42:52.180832"}
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65c80a6b65d04b4e1fe46a3e40bf67fbff4073c1420c80c8065ece8a4552831f
|
3 |
+
size 260817
|