Diogo-V commited on
Commit
6ec2865
1 Parent(s): 0a4c96f

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt +3 -0
  2. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  3. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  4. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  5. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  6. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  7. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  8. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  9. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  10. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  11. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  12. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  14. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  15. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  16. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  17. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  18. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  19. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  20. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  21. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  22. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  23. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  24. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
  26. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt +3 -0
  27. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt +3 -0
  28. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt +3 -0
  29. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
  30. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
  31. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
  32. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt +3 -0
  33. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt +3 -0
  34. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt +3 -0
  35. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
  36. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
  38. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt +3 -0
  39. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt +3 -0
  40. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt +3 -0
  41. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
  42. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
  43. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
  44. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt +3 -0
  45. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt +3 -0
  46. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt +3 -0
  47. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
  48. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
  50. params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51c11ffa139f77bca740c212a2298c0e5fdfe1b9394cfd352de013fbf56d6bf5
3
+ size 205955
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb805f947113f00b22822a99b43c46eec6bae18b0220696cb4cc4df6da44200e
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075949d700797a1158594778650381b933bf2a4de5553afbb9a69f224056ace7
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1255b476389a23dc6c7eb650f83753ae92acd69eaefae4005198debe409bc857
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aab51b6beb5caff267c772b27514bde4c8ea150c56aa4220aecd8a7e8b3c536
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13105c640a58ff07b260ceba6507d64a8363f949dff3131434179129a884c246
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f53147761badd3cad324b505d5e6b58a6edd94d2b370c4cd0257f1731a6168
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed1e49494b3688a11ca6f0b83ec7d3271941a6c7b2d60aac48cbe7df1cce08b
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8ddc4e59cac74bc658fe17b57039258829df64ef32a1c6eda907ec3015d03c
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d5d22bbdd9bafb6a4169f8937ba21d500072fd2cc2b647ec34c880e69390672
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dfa40fb99152219952d44562574af17c3dd625bfc3d3a2050e9e7bf58460470
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98a349b794e1e78c303fa4676e3d1116aa3743f57c88cacc341cc1b2417d9e10
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8da6720a87c5359e9ada9fb8c0a8038b1f9cd9f120b8cd6ad7af6ee2b184997
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45125d4b1998dcb15d9278b27bc37e325628afcad2d8de0acc422009beb99bb3
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086e0d187f38b1fad2a94a92656ef45e031607b7cd9c5ed5727978defda06e7c
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:927f3973ae3bbd9672f58c6e6656d5e098d8c4b29fd7556b3c2491ad8a3c950a
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eef33c1565532bbc77282cb482c58051fc7e8c8b8a424076e1fddd3b4f95b5a
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd82d3da9be519209a0b6049379dcbdaf9fda24ec39092ded652faf956321313
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b862e0ad89e1f19a7006148040f7ad988ffc6bf25fdc4b18c0319d76a71bdf
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85f31ebd41c2450a64e25fdc5db2e5acdcfc8fa60c61c60ed80faa9aa4dc47f1
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31203e9e154f5c3fd2516840155b0b6a2ca0065820e7bbcdc888839c05c9c211
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1878d7ce68a62c1e36ee52442a7ba512ccfe5685ea9bcd549faafe28cbb6aa3
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0040e0b686c84aace19b20a678f545cb756d1b74b1d23bf3ae62939b7bc4603f
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:557fb59a319d0b9ffcb97b02d3285016a21f80e239f4c43c5c54fa77c4ca8a2c
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b20b33489b01f4f2d1399017b1a58699f01d8fe4ed47d7762a94601baf0ef4b5
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8d1219ae8f617ce5bf189ffa179008d37ceb49f6bda1558c2c0e805e7593874
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cab03cfef52a20680f9a8c3df6ae7996f40193679909bca5359d1e027f566c5
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f6f9f3d578616fbe8f211cd4a8ab7882e17b43aa3ebdb3f6efb03efb33e5cf0
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8247d35386523c55947a55e64096c8027912980df221866f92db6075ddeab30
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72d20c31899e82ab70ff78cd8fa2c8a0a3a43abdd31795be35350c4c492baaba
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bf349dbc250e89eb1f81339bb2c6a0ee8f88bee0c7186e27d44fabb3d002c5e
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1a94bed1d7b45d30ed7cdc0c6de22816f15651c930e0ebff63db907d9e44951
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3fb05676516a2e4450287ec07305930184f1b2a543c4033e5c2351d0ffe65e2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a22c4cf2d7b29145665f5bc5b7e6848f05a2c8c3addcc96e375f4e7addc6a819
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605317d2ac75126a12f1d8a9dd4b7a17b813a498abed67805238f552fa8d07bf
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3ef534cc429817f0a2ee11163cccba92c7b299f78b2783c38eb85c9f81c03a
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e34383e007dda1a5c8fe9ca354829db179423ceae651df381f8bd9afb6aa59ea
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e624237b9f1feb4bf8ad92e040ce21a4c51552bd7886293d22df62c8da1f7c39
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f074476e368926186f348dd1d8157ab427d69601f575824d1227814c4df75ebc
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31e8b7f7a02ac617c42eb0fcffa9925718fdb63d564ce524be16cf0d00b266a
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b7f839cd5bf62d1eaa1e6efe80bc2e3df50abcbc22ce9d07b0cc1d42f54fd7b
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5b3b224eb3f2711cc00c516329b87db2acab2562b9f8a8cdb5065dafc945d3
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d53893725fb6bd96e357667901a6393598daeb1fbfbb7342774e425ff5495f29
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5471c2bc15fcb80d7ad40c1451b47ef34b38d547f70054f34f0ae27dbeacd462
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0315870d83ed80c9e9b92687474a3c85f28a288ef2c9ab8b285a113143aeebfc
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a10a055b86452a1bed4d22d0b837e0b6b1d87784ba24221f95806a55b803396
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461e1d10d0c7ec5b5062ef31169c180de3d0e57ee4603e57355fa1a37ce7f6d
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30b797753c3d9d960b646a283864fb06ab5c376e7976136f950224787d25ca68
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecc55167efe69fd95806e47045459a6907b2c56e8af37a3e9a2a538f195f833e
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af778e63338570cced2cec406ba901fbf3da530479011fb4e359816db7ffa836
3
+ size 42115