babakc committed on
Commit
254db30
·
1 Parent(s): 2327bae

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 498.50 +/- 100.10
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 539.00 +/- 147.95
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 2000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 726430265
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3969500058
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 2000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58849367ce33c0ee05c95a69bf598c42e7172bc6a7755279e4b6f455e891dc58
3
  size 27224823
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88892c14612c009220b513da79a6cd0a60e7f5ee8306677e2b539ab2be1d8448
3
  size 27224823
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:659f6744548925cc9ed1f9a71af1a379627e01c40e0a6a7c2c3c69b891bf8030
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8cc2aed46c9a12c501eafc302c2c6ecc896e1cab81e3018a41743c28854d091
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c9b0a91771842fb827bb01811435980ba5431c6ac444e6f6cd25fb74d68292d
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba0c0d9a2d7c13326ce6fdb29f1e4b0469bff6ba8c297383ed56f0471dfe8933
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac49751338152b5dc1577d4ce2bfb5e3805da8281b07a850af624ad23cb1655f
3
- size 211542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9009e502c97ddcf1f060c6c11cc4eae273420633c47cd2d14305e023e0d7465d
3
+ size 265067
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 498.5, "std_reward": 100.10119879402045, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-17T04:52:28.761363"}
 
1
+ {"mean_reward": 539.0, "std_reward": 147.94931564559533, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-17T09:00:20.942649"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:068a6041504c889ae8f236cb2a6d22e97a91566f6318e373a67ad0443fbe75d4
3
- size 36506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca776e81d0bdfcf938a5a7a43b7b4b37fdd7c4a389fd49d9a1814bdcfe290be9
3
+ size 62319