Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbbf5a3236b4bda67cbd5696c4e48ce96ff163b3ba4fab9cf60ba6dd60dbdce3
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62b6ca4022b00270f4b7cc4f6cbf46607debb5a8cc850127f3362a8ee342f4b0
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff14abff21a59681555f1ed7098ab37cb081d9e9d2801abfa7e7ecba33eafe3b
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5df401f0abeef4700f95836a2826807e0510e8f2a723d5b7869d3a6735340ba8
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd4ef4f14ba111dca382184af30a2851f51e3644d48296a31c3ebb0835dc7db2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fa168a597f63636a56ea2f0edd57abaf35f8472755f575c77410f748065fe84
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c36711ddb8ffcbe856fc570f4a7842b814902bfd59ffb3f4ae1d0573b8904d59
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2c844d9a26ef9fab6e30fcb1a192f5c9347b25c2aade1728fd881804920a6f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aa5bba8365e583e56cb2ed060cc5a5beea9cb7e5de2579c9307f7ab01dca2fe
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db331814f3d810d9877bc3f978e6d060553f4693d01dd8c022f5b334723f5047
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5df401f0abeef4700f95836a2826807e0510e8f2a723d5b7869d3a6735340ba8
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19b06c6fca1a324d59a74a26d840d50ea65a4b80b39c33d37b30021d49e4d6f0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a53e9b2c5260df99c4ccc02318eb0985e1cfebeee2555cf5bea34549bdc1901d
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:379236f52f010743759ca65973b563a0e3025e8e9e522753fd3f0d17768edcad
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97e7f56e76ce57ca47406c98f18ae50e221ea0cbe7c15b02c3e9197eb1aeab52
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf4fe0789de715d1cf7c10b80e4ac689133cfeb1f21266be604fc02ebbcfc34f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e651a97459695ce3958464842cb249d9576ac54cb8d34f73bd61de655823f377
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5df401f0abeef4700f95836a2826807e0510e8f2a723d5b7869d3a6735340ba8
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe112af28ef27f24168f11a225db242ab244f365277174c0bc0d7a5b0adef526
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e0013620db1d3febab14e98929228e939c49ef7b0efada31f5f875ff65f108b
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9247895ff07ca0ab600d834c0c12d3693f724500feabb984848689580b0c5205
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeb881515bc6d8145acb112c12e535ac0b5a6f07b56a71a3c41c5f961a9aae92
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e21ffc3af24d6eb387f8ce5f35636fa72aac170a288e4ee6de58ed2b6dd0b03
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e4f1198c96d8173dde4c52025aa9b0938417a6af2364c828157b8494c79fd9f
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5df401f0abeef4700f95836a2826807e0510e8f2a723d5b7869d3a6735340ba8
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3d07e9b05c9ef5840cd36220c3ec8a45697b7993ea73d3e728a12330b7f8899
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:462e7b94de3172f1557502cdbe92b8723f24c58b4dc559fcedeb3e851ba4a3a0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a240e69e3242a62ee703b0f4fc9716769a52ce420630bfaa0c16b92f1292ce8a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07d2298e3460edccff702e9c0e5bdd446a7dace8ed36aed9247b3c2a9da023e6
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58ef7c2fb017a42b7e5518fa74cac0a31d967182b1d379ecb1a45193de1c09f8
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589740718c954d5552920fda20eaf65fb90e65fca4a79ca4be45d78528a2579
|
3 |
+
size 11395
|