Diogo-V commited on
Commit
93c174d
·
verified ·
1 Parent(s): a5ad842

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/8/ones_t/comb_2/init/lm_head/_0.pt +3 -0
  2. params/phi/8/ones_t/comb_2/init/lm_head/_s.pt +3 -0
  3. params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/ones_t/comb_2/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/8/ones_t/comb_2/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a58194e28d6554db10edb6ff5e0f5537f1c4eb7fa9c9faada7e302ab91ac9c40
3
+ size 205955
params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfe0685560234c3522077f77fa8cfe5f577af8e205525916b2973b268cbed072
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
3
+ size 42115
params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
3
+ size 11395