Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51c11ffa139f77bca740c212a2298c0e5fdfe1b9394cfd352de013fbf56d6bf5
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb805f947113f00b22822a99b43c46eec6bae18b0220696cb4cc4df6da44200e
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:075949d700797a1158594778650381b933bf2a4de5553afbb9a69f224056ace7
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1255b476389a23dc6c7eb650f83753ae92acd69eaefae4005198debe409bc857
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aab51b6beb5caff267c772b27514bde4c8ea150c56aa4220aecd8a7e8b3c536
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13105c640a58ff07b260ceba6507d64a8363f949dff3131434179129a884c246
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40f53147761badd3cad324b505d5e6b58a6edd94d2b370c4cd0257f1731a6168
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ed1e49494b3688a11ca6f0b83ec7d3271941a6c7b2d60aac48cbe7df1cce08b
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a8ddc4e59cac74bc658fe17b57039258829df64ef32a1c6eda907ec3015d03c
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d5d22bbdd9bafb6a4169f8937ba21d500072fd2cc2b647ec34c880e69390672
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dfa40fb99152219952d44562574af17c3dd625bfc3d3a2050e9e7bf58460470
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98a349b794e1e78c303fa4676e3d1116aa3743f57c88cacc341cc1b2417d9e10
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8da6720a87c5359e9ada9fb8c0a8038b1f9cd9f120b8cd6ad7af6ee2b184997
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45125d4b1998dcb15d9278b27bc37e325628afcad2d8de0acc422009beb99bb3
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:086e0d187f38b1fad2a94a92656ef45e031607b7cd9c5ed5727978defda06e7c
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927f3973ae3bbd9672f58c6e6656d5e098d8c4b29fd7556b3c2491ad8a3c950a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eef33c1565532bbc77282cb482c58051fc7e8c8b8a424076e1fddd3b4f95b5a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd82d3da9be519209a0b6049379dcbdaf9fda24ec39092ded652faf956321313
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0b862e0ad89e1f19a7006148040f7ad988ffc6bf25fdc4b18c0319d76a71bdf
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85f31ebd41c2450a64e25fdc5db2e5acdcfc8fa60c61c60ed80faa9aa4dc47f1
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31203e9e154f5c3fd2516840155b0b6a2ca0065820e7bbcdc888839c05c9c211
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1878d7ce68a62c1e36ee52442a7ba512ccfe5685ea9bcd549faafe28cbb6aa3
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0040e0b686c84aace19b20a678f545cb756d1b74b1d23bf3ae62939b7bc4603f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:557fb59a319d0b9ffcb97b02d3285016a21f80e239f4c43c5c54fa77c4ca8a2c
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b20b33489b01f4f2d1399017b1a58699f01d8fe4ed47d7762a94601baf0ef4b5
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8d1219ae8f617ce5bf189ffa179008d37ceb49f6bda1558c2c0e805e7593874
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cab03cfef52a20680f9a8c3df6ae7996f40193679909bca5359d1e027f566c5
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f6f9f3d578616fbe8f211cd4a8ab7882e17b43aa3ebdb3f6efb03efb33e5cf0
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8247d35386523c55947a55e64096c8027912980df221866f92db6075ddeab30
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72d20c31899e82ab70ff78cd8fa2c8a0a3a43abdd31795be35350c4c492baaba
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bf349dbc250e89eb1f81339bb2c6a0ee8f88bee0c7186e27d44fabb3d002c5e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1a94bed1d7b45d30ed7cdc0c6de22816f15651c930e0ebff63db907d9e44951
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3fb05676516a2e4450287ec07305930184f1b2a543c4033e5c2351d0ffe65e2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a22c4cf2d7b29145665f5bc5b7e6848f05a2c8c3addcc96e375f4e7addc6a819
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:605317d2ac75126a12f1d8a9dd4b7a17b813a498abed67805238f552fa8d07bf
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a3ef534cc429817f0a2ee11163cccba92c7b299f78b2783c38eb85c9f81c03a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e34383e007dda1a5c8fe9ca354829db179423ceae651df381f8bd9afb6aa59ea
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e624237b9f1feb4bf8ad92e040ce21a4c51552bd7886293d22df62c8da1f7c39
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f074476e368926186f348dd1d8157ab427d69601f575824d1227814c4df75ebc
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a31e8b7f7a02ac617c42eb0fcffa9925718fdb63d564ce524be16cf0d00b266a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b7f839cd5bf62d1eaa1e6efe80bc2e3df50abcbc22ce9d07b0cc1d42f54fd7b
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef5b3b224eb3f2711cc00c516329b87db2acab2562b9f8a8cdb5065dafc945d3
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d53893725fb6bd96e357667901a6393598daeb1fbfbb7342774e425ff5495f29
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5471c2bc15fcb80d7ad40c1451b47ef34b38d547f70054f34f0ae27dbeacd462
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0315870d83ed80c9e9b92687474a3c85f28a288ef2c9ab8b285a113143aeebfc
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a10a055b86452a1bed4d22d0b837e0b6b1d87784ba24221f95806a55b803396
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2461e1d10d0c7ec5b5062ef31169c180de3d0e57ee4603e57355fa1a37ce7f6d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b797753c3d9d960b646a283864fb06ab5c376e7976136f950224787d25ca68
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecc55167efe69fd95806e47045459a6907b2c56e8af37a3e9a2a538f195f833e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af778e63338570cced2cec406ba901fbf3da530479011fb4e359816db7ffa836
|
3 |
+
size 42115
|