juanzinser committed on
Commit
8d85f5f
·
1 Parent(s): 86fb22c

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 169.00 +/- 59.70
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 400000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 533.50 +/- 195.41
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 355918235
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 128780410
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 400000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:167438c99f196b30a33081c58ccd81d069e9065db9fd8cf7efbd77f5a3ef5810
3
- size 27220784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c954551262ca01a78ed94d86090cf1ed4cc1e9e59282a2db78d2260b51544ba5
3
+ size 27220788
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9be98eaf9486df45a614cfa6193e9f3d35b185badb2773cbada9c4e1138f98af
3
  size 13506236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc38e8606d40520810c12de46f52441536cfa815b51a707eb6c0e193f2c3350d
3
  size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76b0627f4a8096f038f51682e6518724d257e867f1cb98c3c61906feea1bc0b8
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b413478c840efc8ad0e7f2d8adf556a29c4ea2576e5cb066183a2d2c94389bb0
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:556df3839236d381767bece908c13132dfbcaf17bb80e589fbce866807dbd49b
3
- size 248068
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88c7a4f4c27fa5733daf67c32648113c3fa5b2af9ccc9cd9a5ec2038258aacc3
3
+ size 251372
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 169.0, "std_reward": 59.6992462263972, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-29T20:38:52.153016"}
 
1
+ {"mean_reward": 533.5, "std_reward": 195.41046543110224, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-06-01T00:32:38.404283"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dad63d50e525f63fcee6b756aeca2fc08cb39b65675bd36bba722f6885c9501c
3
- size 18521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73283ec29bc30554f5fe63c3dd29df70076119174115c4af7d09597739db2c11
3
+ size 35597