Diogo-V commited on
Commit
900f800
1 Parent(s): d242b6e

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/5/ones_t/comb_12/init/lm_head/_0.pt +3 -0
  2. params/phi/5/ones_t/comb_12/init/lm_head/_s.pt +3 -0
  3. params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/ones_t/comb_12/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/5/ones_t/comb_12/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:397d38c6da4509e14d765f0248c85f16263697f14f755563c0dd9e5a5a6266e8
3
+ size 205955
params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0dd77acfb6489f1266888714e98b7325cb8fe3294efe883d5d7ebecd65fa06d
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84aa9426450d2cd78435a85231111c760184e24f26bd4f38c57c7cd270073193
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65737e5b1a9d55ae2a38539fce368987f0d6c3c7714cb4221d631553844bbc5f
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17093f4f443982aeff5805ce69e396c0d817085b022f126c549552ba236cb9bb
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab34b13a281429af2c8cad603546a4e1159d14b769ceeaf679dcb8b01eb1578
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f8f2f0ee6c5d4c2b7202e2e7298a6352e90a70ea06c0bddddc6974ff613b2af
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceefee8d0170904dc9906b6815b923fbefdff289c3d2ae55746d1936eff65e1b
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:691cbd0269444adc5bf5aef398559bc5fe630247d28c0a96ad3c4fea96bf0de6
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f54ac8c11db853353f28f03a237afe4a12db3739db729b69f53aa26b216f79
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ff4a9f00e0f61a2cbea0f804cfef16aa04b953095cea78a40d27f9a8b83304f
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddc76536e769f6f8891c8e45af78a6a29c74b30d486b7c433e35fa99e218c049
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f8954484212def279589d571c29687a54529540124566b3939d3faa6c4799bb
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c2344ece6c3db5e448d72c300297b5ab264311018bc506bec90ee0110b7ea9f
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d97291d1c9677f602569b2c431bf7629d1ec53b46043a007cf151da4e72b80d
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbd41f17453ada72c58c8d6029b256ff0809cb0836c48bf479d0917da9b679cf
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b180ceca580314fa6b3ca28fdb8728ef86f92b285fb12cdb115a6072215fc3a2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e266a5699bd4ef314f1ce619f68dcc4076c7f38a14e12e873b42ba9f3b7a0193
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c7624835fc3f33f8f00484eefc8b410f6349f35982cb8f5d5937c6a48ce4ec
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:345e216724f00f21e882a5cb6ba442a3dd762414e86a368beb36ce0b9eb5ad89
3
+ size 42115
params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ebda415a73027bb35f951589b449dbbec46512b474b10e394876ecb96cffc4a
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87826aacb7050bdde6dfd40ebac49a8e732a808403f3e8670d84af1a314195f5
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20742b3811b73e52a0987bbac53fc38ce21686f97dcef7c47d53b18b09f0735d
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c043fc692c383944e55db185b06ee19e63aed9cd417abd2bce3fc73b945d217
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/5/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f30f54123bf2f8fb890777ed2422903c958f98abf209882ac028984690f53d0f
3
+ size 11395