|
Layer,Mode,Rank,Alpha,Dropout,Weight_lr_init,Weight_lr_final,Weight_decay,State_lr_init,State_lr_final,RejectParts |
|
emb,freeze,0,0,0.01,0.000001,0.0000001,0.01,0.05,0.01, |
|
0,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
1,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
2,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
3,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
4,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
5,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
6,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
7,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
8,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
9,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
10,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
11,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
12,bone,256,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
13,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
14,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
15,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
16,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
17,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
18,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
19,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
20,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
21,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
22,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
23,bone,512,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
24,full,1280,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
25,full,1280,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
26,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
27,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
28,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
29,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
30,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
31,full,1024,32,0.01,5.00E-05,1.00E-05,0.01,0.05,0.01, |
|
head,full,512,32,0.01,0.00001,0.000001,0.01,0.05,0.01, |
|
|