lrl-modelcloud's picture
Upload folder using huggingface_hub (#1)
6805f88 verified
raw
history blame
6.92 kB
layer,module,loss,damp,time
0,self_attn.k_proj,0.00669,0.10000,0.572
0,self_attn.v_proj,0.00015,0.10000,0.366
0,self_attn.q_proj,0.04556,0.10000,0.369
0,self_attn.o_proj,0.00003,0.10000,0.365
0,mlp.up_proj,0.57997,0.10000,0.394
0,mlp.gate_proj,0.91966,0.10000,0.393
0,mlp.down_proj,0.01179,0.10000,1.944
1,self_attn.k_proj,0.06515,0.10000,0.361
1,self_attn.v_proj,0.00657,0.10000,0.371
1,self_attn.q_proj,0.22341,0.10000,0.374
1,self_attn.o_proj,0.00404,0.10000,0.374
1,mlp.up_proj,0.78053,0.10000,0.401
1,mlp.gate_proj,1.47476,0.10000,0.398
1,mlp.down_proj,0.01116,0.10000,1.960
2,self_attn.k_proj,0.13747,0.10000,0.371
2,self_attn.v_proj,0.01578,0.10000,0.367
2,self_attn.q_proj,0.46999,0.10000,0.372
2,self_attn.o_proj,0.00497,0.10000,0.370
2,mlp.up_proj,1.05533,0.10000,0.400
2,mlp.gate_proj,1.95990,0.10000,0.395
2,mlp.down_proj,0.54380,0.10000,2.036
3,self_attn.k_proj,0.14006,0.10000,0.365
3,self_attn.v_proj,0.03060,0.10000,0.370
3,self_attn.q_proj,0.59166,0.10000,0.380
3,self_attn.o_proj,0.00675,0.10000,0.380
3,mlp.up_proj,1.98003,0.10000,0.401
3,mlp.gate_proj,3.62075,0.10000,0.396
3,mlp.down_proj,0.64975,0.10000,2.032
4,self_attn.k_proj,0.09814,0.10000,0.366
4,self_attn.v_proj,0.04382,0.10000,0.366
4,self_attn.q_proj,0.46673,0.10000,0.373
4,self_attn.o_proj,0.01211,0.10000,0.377
4,mlp.up_proj,1.58077,0.10000,0.401
4,mlp.gate_proj,2.47939,0.10000,0.397
4,mlp.down_proj,0.03189,0.10000,1.972
5,self_attn.k_proj,0.12246,0.10000,0.368
5,self_attn.v_proj,0.05167,0.10000,0.368
5,self_attn.q_proj,0.61106,0.10000,0.373
5,self_attn.o_proj,0.01123,0.10000,0.375
5,mlp.up_proj,2.01079,0.10000,0.406
5,mlp.gate_proj,4.08619,0.10000,0.396
5,mlp.down_proj,0.03081,0.10000,1.992
6,self_attn.k_proj,0.11447,0.10000,0.363
6,self_attn.v_proj,0.03224,0.10000,0.361
6,self_attn.q_proj,0.50002,0.10000,0.371
6,self_attn.o_proj,0.01039,0.10000,0.371
6,mlp.up_proj,1.59279,0.10000,0.403
6,mlp.gate_proj,2.33140,0.10000,0.424
6,mlp.down_proj,0.03129,0.10000,1.943
7,self_attn.k_proj,0.17277,0.10000,0.363
7,self_attn.v_proj,0.04741,0.10000,0.364
7,self_attn.q_proj,0.70939,0.10000,0.370
7,self_attn.o_proj,0.01649,0.10000,0.373
7,mlp.up_proj,1.71943,0.10000,0.401
7,mlp.gate_proj,2.22081,0.10000,0.397
7,mlp.down_proj,0.03903,0.10000,1.962
8,self_attn.k_proj,0.11656,0.10000,0.360
8,self_attn.v_proj,0.04624,0.10000,0.365
8,self_attn.q_proj,0.79887,0.10000,0.371
8,self_attn.o_proj,0.02273,0.10000,0.368
8,mlp.up_proj,1.43981,0.10000,0.413
8,mlp.gate_proj,1.95721,0.10000,0.397
8,mlp.down_proj,0.02604,0.10000,1.942
9,self_attn.k_proj,0.33948,0.10000,0.362
9,self_attn.v_proj,0.08356,0.10000,0.362
9,self_attn.q_proj,1.38756,0.10000,0.373
9,self_attn.o_proj,0.01633,0.10000,0.374
9,mlp.up_proj,1.48946,0.10000,0.400
9,mlp.gate_proj,1.75232,0.10000,0.396
9,mlp.down_proj,0.02843,0.10000,1.953
10,self_attn.k_proj,0.10033,0.10000,0.365
10,self_attn.v_proj,0.06627,0.10000,0.364
10,self_attn.q_proj,0.50354,0.10000,0.375
10,self_attn.o_proj,0.02601,0.10000,0.373
10,mlp.up_proj,1.28366,0.10000,0.400
10,mlp.gate_proj,1.68165,0.10000,0.395
10,mlp.down_proj,0.02453,0.10000,1.970
11,self_attn.k_proj,0.35640,0.10000,0.364
11,self_attn.v_proj,0.08797,0.10000,0.363
11,self_attn.q_proj,1.44697,0.10000,0.373
11,self_attn.o_proj,0.01708,0.10000,0.374
11,mlp.up_proj,1.46764,0.10000,0.400
11,mlp.gate_proj,1.59477,0.10000,0.403
11,mlp.down_proj,0.03929,0.10000,1.959
12,self_attn.k_proj,0.09292,0.10000,0.366
12,self_attn.v_proj,0.06008,0.10000,0.366
12,self_attn.q_proj,0.50941,0.10000,0.376
12,self_attn.o_proj,0.02493,0.10000,0.407
12,mlp.up_proj,1.36413,0.10000,0.420
12,mlp.gate_proj,1.50805,0.10000,0.423
12,mlp.down_proj,0.02825,0.10000,2.090
13,self_attn.k_proj,0.17860,0.10000,0.391
13,self_attn.v_proj,0.06740,0.10000,0.392
13,self_attn.q_proj,0.91921,0.10000,0.375
13,self_attn.o_proj,0.02215,0.10000,0.405
13,mlp.up_proj,1.60880,0.10000,0.428
13,mlp.gate_proj,1.61348,0.10000,0.419
13,mlp.down_proj,0.03996,0.10000,1.946
14,self_attn.k_proj,0.12914,0.10000,0.363
14,self_attn.v_proj,0.10303,0.10000,0.360
14,self_attn.q_proj,0.79523,0.10000,0.370
14,self_attn.o_proj,0.04685,0.10000,0.372
14,mlp.up_proj,1.58363,0.10000,0.395
14,mlp.gate_proj,1.77731,0.10000,0.392
14,mlp.down_proj,0.04859,0.10000,1.937
15,self_attn.k_proj,0.13345,0.10000,0.362
15,self_attn.v_proj,0.08482,0.10000,0.361
15,self_attn.q_proj,0.72791,0.10000,0.372
15,self_attn.o_proj,0.03135,0.10000,0.371
15,mlp.up_proj,2.07139,0.10000,0.398
15,mlp.gate_proj,2.14117,0.10000,0.393
15,mlp.down_proj,0.06882,0.10000,2.049
16,self_attn.k_proj,0.25867,0.10000,0.366
16,self_attn.v_proj,0.23036,0.10000,0.368
16,self_attn.q_proj,1.52680,0.10000,0.372
16,self_attn.o_proj,0.03056,0.10000,0.404
16,mlp.up_proj,2.59174,0.10000,0.404
16,mlp.gate_proj,3.33505,0.10000,0.403
16,mlp.down_proj,0.12967,0.10000,2.131
17,self_attn.k_proj,0.15921,0.10000,0.364
17,self_attn.v_proj,0.14702,0.10000,0.363
17,self_attn.q_proj,1.03912,0.10000,0.379
17,self_attn.o_proj,0.02504,0.10000,0.373
17,mlp.up_proj,2.94703,0.10000,0.400
17,mlp.gate_proj,4.60301,0.10000,0.399
17,mlp.down_proj,0.10250,0.10000,2.064
18,self_attn.k_proj,0.17395,0.10000,0.362
18,self_attn.v_proj,0.13174,0.10000,0.361
18,self_attn.q_proj,1.01365,0.10000,0.377
18,self_attn.o_proj,0.02879,0.10000,0.382
18,mlp.up_proj,2.89602,0.10000,0.416
18,mlp.gate_proj,3.61816,0.10000,0.394
18,mlp.down_proj,0.11206,0.10000,2.045
19,self_attn.k_proj,0.15185,0.10000,0.365
19,self_attn.v_proj,0.12662,0.10000,0.366
19,self_attn.q_proj,0.91668,0.10000,0.372
19,self_attn.o_proj,0.04191,0.10000,0.377
19,mlp.up_proj,4.22402,0.10000,0.402
19,mlp.gate_proj,5.07732,0.10000,0.397
19,mlp.down_proj,0.21600,0.10000,1.942
20,self_attn.k_proj,0.21450,0.10000,0.368
20,self_attn.v_proj,0.46156,0.10000,0.375
20,self_attn.q_proj,1.34480,0.10000,0.383
20,self_attn.o_proj,0.07874,0.10000,0.373
20,mlp.up_proj,4.72404,0.10000,0.405
20,mlp.gate_proj,5.23060,0.10000,0.420
20,mlp.down_proj,0.30142,0.10000,1.931
21,self_attn.k_proj,0.25363,0.10000,0.363
21,self_attn.v_proj,0.68723,0.10000,0.361
21,self_attn.q_proj,1.54567,0.10000,0.371
21,self_attn.o_proj,0.19063,0.10000,0.373
21,mlp.up_proj,4.74235,0.10000,0.399
21,mlp.gate_proj,5.02750,0.10000,0.393
21,mlp.down_proj,1.48262,0.10000,1.988
22,self_attn.k_proj,0.24376,0.10000,0.361
22,self_attn.v_proj,0.69571,0.10000,0.368
22,self_attn.q_proj,1.45133,0.10000,0.380
22,self_attn.o_proj,0.05970,0.10000,0.381
22,mlp.up_proj,4.15480,0.10000,0.406
22,mlp.gate_proj,3.93745,0.10000,0.398
22,mlp.down_proj,0.47177,0.10000,1.975
23,self_attn.k_proj,0.30426,0.10000,0.368
23,self_attn.v_proj,0.64836,0.10000,0.365
23,self_attn.q_proj,1.41738,0.10000,0.374
23,self_attn.o_proj,0.18444,0.10000,0.374
23,mlp.up_proj,4.43292,0.10000,0.401
23,mlp.gate_proj,4.59121,0.10000,0.397
23,mlp.down_proj,0.96985,0.10000,1.943