Upload . with huggingface_hub
Browse files- .DS_Store +0 -0
- .gitattributes +1 -0
- README.md +23 -0
- backup_models/best_reinforce_lunar_lander_cont_model_247.147.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_248.915.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_249.478.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_251.64.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_252.499.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_253.295.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_256.824.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_259.457.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_263.751.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_264.418.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_265.261.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_265.679.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_266.437.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_266.728.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_267.386.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_268.143.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_269.185.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_270.574.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_270.846.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_272.109.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_288.627.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_292.715.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_298.926.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_304.476.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_308.668.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_312.28.pt +3 -0
- backup_models/best_reinforce_lunar_lander_cont_model_318.721.pt +3 -0
- best_reinforce_lunar_lander_cont_model_269.402.pt +3 -0
- hyperparameters.json +1 -0
- replay.mp4 +3 -0
.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
.gitattributes
CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
+
replay.mp4 filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
tags:
|
3 |
+
- LunarLanderContinuous-v2
|
4 |
+
- reinforce
|
5 |
+
- reinforcement-learning
|
6 |
+
- custom-implementation
|
7 |
+
model-index:
|
8 |
+
- name: REINFORCE-LunarLanderContinuous-v2
|
9 |
+
results:
|
10 |
+
- task:
|
11 |
+
type: reinforcement-learning
|
12 |
+
name: reinforcement-learning
|
13 |
+
dataset:
|
14 |
+
name: LunarLanderContinuous-v2
|
15 |
+
type: LunarLanderContinuous-v2
|
16 |
+
metrics:
|
17 |
+
- type: mean_reward
|
18 |
+
value: 264.10 +/- 37.17
|
19 |
+
name: mean_reward
|
20 |
+
verified: false
|
21 |
+
---
|
22 |
+
|
23 |
+
# **Reinforce** Agent playing **LunarLanderContinuous-v2**
|
backup_models/best_reinforce_lunar_lander_cont_model_247.147.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6606809113411e5dd688f3e212b765fa88c72a0ba0d599c34605dac1fcf34c59
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_248.915.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20f9e0865ba8e1464a8a8e80497ab7f14f9d00c49e67f0947804e0ea4cbcb794
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_249.478.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67918301a712c65392e29145c715677fd5434980acddfc59fe0be85bb9d3d9f3
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_251.64.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d498c5e8f25f1dd1c8bbae1870c9f1063b5fb94acc9fc18b30884a0bf68607a4
|
3 |
+
size 148427
|
backup_models/best_reinforce_lunar_lander_cont_model_252.499.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1255bc9f11e11bd2ef050a220403729f1b0a32acc4fe2463d824811af2e21235
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_253.295.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6b43d91bfa7fdde05dfea8396fc376bbebcbf4313c4bc5e357caa5e502af1fd
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_256.824.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fa87fb4d758c8c8dad036b0cd06b656c07f09e31dc3698cf7e33119352ea5a5
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_259.457.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53de582565aaf5f6723cd8c7481e4981d558e1c663325329aa879a3e76a52ea9
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_263.751.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c08bf0c5f8445217599023a59b3bf606b144fdff68113d7acc81dd8580f5469
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_264.418.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e899524dd1a45926f1087b9bd0518fdfa1f42b413afb013471fc3a062d60333
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_265.261.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:180f85f80e4d4372b1bde095c94c910a148067183256cf2b56c1c881ca482147
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_265.679.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa4a43636e2789716f2b3cc05b4e871fb624ebb2c71d0de06b9c9434bf555011
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_266.437.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29ed4892715e91f95bccfa6cd3a2d6fc3790d74f2c440ced9555b9eb3e8482ba
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_266.728.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6af677a52ae46a7b3f59df10a753e0fb0c4275ee41ed63d1f1447f82ea211bd7
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_267.386.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64fda45fbaafd4372d14159c7e84b54db0a51d2e796d687a1b15920c9976850f
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_268.143.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2573a74611e537f5859ef8f6f53c9d0d9337cf6e5b54fbeda8a0133fc94f3932
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_269.185.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d75450f4debc5b38ac0e37369655c22385a17a921dada21bbcc9fa684b1b4c7
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_270.574.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5096b7647cf2989f98429df15f5a4ee3ff6aaed91b3bf029c68ebb33dca9f04
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_270.846.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b12c532b218b3a217b8e2de59a61db1620980cd6c8e05fb662414542a70bb8b
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_272.109.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c1566642308bbdeafecf5b311b7f6f0ac3a44c35f040da892ebc27a9cd1a515
|
3 |
+
size 148437
|
backup_models/best_reinforce_lunar_lander_cont_model_288.627.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:763de0f7e5862e2b5282bc07848ff5a07f14ea25552ca4fd9e8ad79118e80b47
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_292.715.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7d15eaee786b01b9b5d5d5a9933003374d58dc699a7cbc0b87241dbcd6e2631
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_298.926.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b24afbeaa24168aead1933a9cd8047170d78f182f92772a38c536e30aad13b5f
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_304.476.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7c040f5b236cb551d9c5a0aefda7cf21ffb82cd9300de7fdba5a3a19aa6738f
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_308.668.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a7edde23bac7531bb5316b90048c3cc0bdb21aa34225b2761d8ccf51d388652
|
3 |
+
size 147413
|
backup_models/best_reinforce_lunar_lander_cont_model_312.28.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:446ae0ea02b919bf0b658d2e745aeedd60b0c70eb8b2665b120cfbce0e3faea5
|
3 |
+
size 147403
|
backup_models/best_reinforce_lunar_lander_cont_model_318.721.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99bc767ab3f4a537ed5f7ffa2ec45f2a70d65967aceb0ae3f20f4ae11dec4527
|
3 |
+
size 147413
|
best_reinforce_lunar_lander_cont_model_269.402.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e659b3cfdeb543a374d69fe7555626c9ff93bdc4dcb14c0c85d2d257e636683
|
3 |
+
size 148437
|
hyperparameters.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"env_id": "LunarLanderContinuous-v2", "mean_reward": 264.103, "n_evaluation_episodes": 900, "eval_datetime": "2023-01-17T15:13:05.144129"}
|
replay.mp4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb10f4136d2ecfbb0774b97b5723e91aa504c3e41816dd263ccd9e320f553bed
|
3 |
+
size 1039270
|