moisesrobles04 committed on
Commit
c458809
·
1 Parent(s): ec9ad3a

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 223.50 +/- 89.39
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,21 +62,21 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 64),
66
- ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.1),
71
- ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
- ('learning_rate', 0.001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 800000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
- ('train_freq', 4),
80
  ('normalize', False)])
81
  ```
82
 
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 268.50 +/- 78.17
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 128),
66
+ ('buffer_size', 101000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.1),
71
+ ('frame_stack', 5),
72
  ('gradient_steps', 1),
73
+ ('learning_rate', 0.03),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 900000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
+ ('train_freq', 5),
80
  ('normalize', False)])
81
  ```
82
 
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 122165829
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2359424619
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,8 +1,8 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 64
4
  - - buffer_size
5
- - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
@@ -10,15 +10,15 @@
10
  - - exploration_fraction
11
  - 0.1
12
  - - frame_stack
13
- - 4
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 0.001
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 800000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
@@ -26,4 +26,4 @@
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
29
- - 4
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 128
4
  - - buffer_size
5
+ - 101000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
 
10
  - - exploration_fraction
11
  - 0.1
12
  - - frame_stack
13
+ - 5
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 0.03
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 900000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
29
+ - 5
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47db1150cdd059039a22520123f465ec108ba6a4cbe7fad0e9d07d4e187c2ad3
3
- size 27218381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eebb804468132ec5da5194fa3e91a2faf3229085379e55d92d25203ae64c3350
3
+ size 27299107
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b19263a327fe6a9b664437c52cf77407c7a33078bea1cccf04d6ae8ba39a7621
3
- size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e4e8e1547e024fb27953de879cef7aefda49b04e6c81fb2ba3697adf55093c0
3
+ size 13522123
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a43008a3c7cb53adef164e80bbd0424b8a2d480e874101e74cd3b8451ead551
3
- size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ab046edc1867018c60a39335720001e38df131b9119d67b216694a68e5770f
3
+ size 13521321
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
  - OS: Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023
2
- - Python: 3.10.6
3
  - Stable-Baselines3: 2.0.0
4
  - PyTorch: 2.0.1+cu118
5
  - GPU Enabled: True
6
- - Numpy: 1.22.4
7
  - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.28.1
9
  - OpenAI Gym: 0.26.2
 
1
  - OS: Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023
2
+ - Python: 3.10.12
3
  - Stable-Baselines3: 2.0.0
4
  - PyTorch: 2.0.1+cu118
5
  - GPU Enabled: True
6
+ - Numpy: 1.23.5
7
  - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.28.1
9
  - OpenAI Gym: 0.26.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45c22dea565ea383fff3bc509d502adf0a52a1b963f654e167c3ac3df4c52175
3
- size 278865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a799ac9657faeb813344ec56ae265d381f35a430091e2c90337e271719a9db
3
+ size 278674
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 223.5, "std_reward": 89.38819832617726, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-07-20T18:25:43.430477"}
 
1
+ {"mean_reward": 268.5, "std_reward": 78.16808811785025, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-08-10T14:35:33.969344"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba3494e7d91cb5b40bef174b8d76a6fd17e2e50ccb7e4d67b256cdb3e2b3d346
3
- size 33730
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:917e410675e577ba80b0fba6d9606ef82821fa1fb9e016da330a927526492397
3
+ size 37830