aapot
committed on
Commit
•
2ebfd3b
1
Parent(s):
0790246
Add 290k train step and HF flax model
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_290000/checkpoint +3 -0
- checkpoint_290000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_290000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_290000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_290000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31e6d94765266375caa47d7b6ac289478a9995e0147633f22afe334e433d5a5f
|
3 |
+
size 1037969
|
checkpoint_290000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50a485338495b1f4ea274c2ea844b7d72b81949609c8d1bface811190708fc4d
|
3 |
+
size 1416
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:299db7a9356e0183fcbb808fb707f71b21f189ff1160eef5bd6b4a916523cbd7
|
3 |
+
size 1435
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe9d6cc2a7841316e4ef9e8376c1d9dafcfd490f251d9cc1ca85a6da03af4992
|
3 |
+
size 1373
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24c56cca24608546660b818edddde684098f376eb0c475c34b84990ecd729e12
|
3 |
+
size 1442
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d4918556b2cc9bb6734f47f535ce920b6e12e202377bfe01a457d50081bcd91
|
3 |
+
size 1432
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79711bb0bceafc9d9788365b4fc9327c27945c90ac3683e90cfae0fe1c097880
|
3 |
+
size 1426
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db48f4f343a23689d7b56b74a59ec19ef5ffc459b677021364063e86f9a2455e
|
3 |
+
size 1453
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c562697ccf452c4754aaf8c8b6282346d28da072aae8b99cf338cd3b9cb1be80
|
3 |
+
size 1435
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41226f2c275331a0a347a794407b2042f4c4f01f67e998dded86d2fae40f580f
|
3 |
+
size 1437
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc64503152fafcd064bda7fc766dae7857313819d0e8ed0b3c667c764d0ebdb
|
3 |
+
size 1432
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e6c99e267f43c7cbd2fe9f6d846b5c4ba059f2e9761ce0a1da471f79929b6a
|
3 |
+
size 1418
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45b63c955659ff041aac339eb950ef5ff7cd3004f759a5606b031b78573e65a7
|
3 |
+
size 1390
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de6d022adc0018e81138087bee1af95a01a7ca41177d86afba5062b92f90ef1
|
3 |
+
size 1396
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb120b470bb5ef2ba2c182d12ca0222b75c7d1757c3b5fee6fa6a97af6d5642
|
3 |
+
size 1406
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e178c1ef25f7ebef2bb6d59b97ac2c98885d0a634a66a3fbab69da748db9694f
|
3 |
+
size 1384
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:271ebaff2688e1ce5820ef0b627610c562454a9f72e31513db8ac67163022ddb
|
3 |
+
size 1400
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e211529484d4d5277c0445778d427ffdd490462a12ae374d367da6adc4688410
|
3 |
+
size 1413
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61401b8e6b7de32051e4f43e9774f4ea637753456351e5945b64c2797650a9fb
|
3 |
+
size 1378
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e266fd746687590d8720d4b7c8c757b3929027f7ca6ad3e7f3780dc8054bd4c7
|
3 |
+
size 1389
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57d93e632e7e4d8461875ecf0b31d8606f79ab6dc50f30999e89a7d4c3d09f7e
|
3 |
+
size 1408
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b4b8aebb1d9bd8baf37886fd18c58972cf147c05ed84bd388565715e8915699
|
3 |
+
size 1375
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d63231045a4f13d566f9fe9cb997500484cfcb481fd539488dc243863cd51a9c
|
3 |
+
size 1398
|
checkpoint_290000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8112349e3cd6287c6cd09f1a38884024d9bbf683eabceec5b81acadcc22e2e8a
|
3 |
+
size 1431
|
checkpoint_290000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_290000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa17da939c1ff1c6abb88145965aa8c46ee3d43f42dda191247822336145b224
|
3 |
+
size 1427
|
checkpoint_290000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|