Saving weights and logs of step 750000
Browse files
config.json
CHANGED
@@ -19,10 +19,11 @@
|
|
19 |
"num_heads": 6,
|
20 |
"num_layers": 12,
|
21 |
"pad_token_id": 0,
|
|
|
22 |
"relative_attention_num_buckets": 32,
|
23 |
"tie_word_embeddings": false,
|
24 |
"tokenizer_class": "ByT5Tokenizer",
|
25 |
-
"transformers_version": "4.
|
26 |
"use_cache": true,
|
27 |
"vocab_size": 384
|
28 |
}
|
|
|
19 |
"num_heads": 6,
|
20 |
"num_layers": 12,
|
21 |
"pad_token_id": 0,
|
22 |
+
"relative_attention_max_distance": 128,
|
23 |
"relative_attention_num_buckets": 32,
|
24 |
"tie_word_embeddings": false,
|
25 |
"tokenizer_class": "ByT5Tokenizer",
|
26 |
+
"transformers_version": "4.19.0.dev0",
|
27 |
"use_cache": true,
|
28 |
"vocab_size": 384
|
29 |
}
|
events.out.tfevents.1650288432.t1v-n-fb181105-w-0.193063.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:125d6cd3bb7de3ac6796f2d02425856bfe11d0b33003910371f7d36e50a06cb6
|
3 |
+
size 37258932
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1198558445
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70f7a8c616d676b09cf3d1fcfe7c0b9a42f8ea22c2afec3047e7c943921a3b7a
|
3 |
size 1198558445
|