Training in progress, epoch 1
Browse files- .gitattributes +1 -0
- .gitignore +1 -0
- config.json +40 -0
- pytorch_model.bin +3 -0
- runs/Jun15_10-24-21_dfcef795325b/1655288694.3531384/events.out.tfevents.1655288694.dfcef795325b.82.1 +3 -0
- runs/Jun15_10-24-21_dfcef795325b/events.out.tfevents.1655288694.dfcef795325b.82.0 +3 -0
- runs/Jun15_10-27-00_dfcef795325b/1655288888.3831806/events.out.tfevents.1655288888.dfcef795325b.82.3 +3 -0
- runs/Jun15_10-27-00_dfcef795325b/events.out.tfevents.1655288888.dfcef795325b.82.2 +3 -0
- runs/Jun15_10-33-04_dfcef795325b/1655289198.7075686/events.out.tfevents.1655289198.dfcef795325b.522.1 +3 -0
- runs/Jun15_10-33-04_dfcef795325b/events.out.tfevents.1655289198.dfcef795325b.522.0 +3 -0
- runs/Jun15_10-44-34_dfcef795325b/1655289887.5414565/events.out.tfevents.1655289887.dfcef795325b.799.1 +3 -0
- runs/Jun15_10-44-34_dfcef795325b/events.out.tfevents.1655289887.dfcef795325b.799.0 +3 -0
- runs/Jun15_10-57-52_dfcef795325b/1655290687.6443229/events.out.tfevents.1655290687.dfcef795325b.1148.1 +3 -0
- runs/Jun15_10-57-52_dfcef795325b/events.out.tfevents.1655290687.dfcef795325b.1148.0 +3 -0
- runs/Jun15_11-03-13_dfcef795325b/1655291008.2963707/events.out.tfevents.1655291008.dfcef795325b.1345.1 +3 -0
- runs/Jun15_11-03-13_dfcef795325b/events.out.tfevents.1655291008.dfcef795325b.1345.0 +3 -0
- special_tokens_map.json +1 -0
- tokenizer.json +3 -0
- tokenizer_config.json +1 -0
- training_args.bin +3 -0
.gitattributes
CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
28 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "joeddav/xlm-roberta-large-xnli",
|
3 |
+
"architectures": [
|
4 |
+
"XLMRobertaForSequenceClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"gradient_checkpointing": false,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 1024,
|
14 |
+
"id2label": {
|
15 |
+
"0": "contradiction",
|
16 |
+
"1": "neutral",
|
17 |
+
"2": "entailment"
|
18 |
+
},
|
19 |
+
"initializer_range": 0.02,
|
20 |
+
"intermediate_size": 4096,
|
21 |
+
"label2id": {
|
22 |
+
"contradiction": 0,
|
23 |
+
"entailment": 2,
|
24 |
+
"neutral": 1
|
25 |
+
},
|
26 |
+
"layer_norm_eps": 1e-05,
|
27 |
+
"max_position_embeddings": 514,
|
28 |
+
"model_type": "xlm-roberta",
|
29 |
+
"num_attention_heads": 16,
|
30 |
+
"num_hidden_layers": 24,
|
31 |
+
"output_past": true,
|
32 |
+
"pad_token_id": 1,
|
33 |
+
"position_embedding_type": "absolute",
|
34 |
+
"problem_type": "single_label_classification",
|
35 |
+
"torch_dtype": "float32",
|
36 |
+
"transformers_version": "4.19.4",
|
37 |
+
"type_vocab_size": 1,
|
38 |
+
"use_cache": true,
|
39 |
+
"vocab_size": 250002
|
40 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73a2d5351ba3c556e6f7252b3861f7049ab52e247377801b23c32acd875112ef
|
3 |
+
size 2239711213
|
runs/Jun15_10-24-21_dfcef795325b/1655288694.3531384/events.out.tfevents.1655288694.dfcef795325b.82.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0429f588b44a2671823e719accd45b0d0f98e50d909ade5a61f81509cf92903c
|
3 |
+
size 5227
|
runs/Jun15_10-24-21_dfcef795325b/events.out.tfevents.1655288694.dfcef795325b.82.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb1a893810f84592649bfab095472f26052163c2ffe92bace6fa98b4cef627df
|
3 |
+
size 3850
|
runs/Jun15_10-27-00_dfcef795325b/1655288888.3831806/events.out.tfevents.1655288888.dfcef795325b.82.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7c6a0a570bd6443857716762218b01f538991a6297016d95a71b7e0d412f0ba
|
3 |
+
size 5227
|
runs/Jun15_10-27-00_dfcef795325b/events.out.tfevents.1655288888.dfcef795325b.82.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa855e97631e0e89c03f662e9b8a0195eea3b4a3a9916e53c769763a9e2b4a19
|
3 |
+
size 3897
|
runs/Jun15_10-33-04_dfcef795325b/1655289198.7075686/events.out.tfevents.1655289198.dfcef795325b.522.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d02b836afe1f7432d002183bf207eecae56a6c9e513fcecb06087b3e05158029
|
3 |
+
size 5227
|
runs/Jun15_10-33-04_dfcef795325b/events.out.tfevents.1655289198.dfcef795325b.522.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc723647bb1052c808b913e10c3f4aa3f8d084c30937f56ffbd33b7de506517c
|
3 |
+
size 3848
|
runs/Jun15_10-44-34_dfcef795325b/1655289887.5414565/events.out.tfevents.1655289887.dfcef795325b.799.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:635e2c94c23b50e0132326382ef7b85b58a4ef3fde27913226077256c9d4b9f2
|
3 |
+
size 5227
|
runs/Jun15_10-44-34_dfcef795325b/events.out.tfevents.1655289887.dfcef795325b.799.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7be3822bb8ae886137971202a06d3c2583d87d77c1dad29ce84c0f12143b17d7
|
3 |
+
size 4476
|
runs/Jun15_10-57-52_dfcef795325b/1655290687.6443229/events.out.tfevents.1655290687.dfcef795325b.1148.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb92c679b8a7684b3f8991d8a36dbda9c0d505a67e9efa91c261e50d42c648e6
|
3 |
+
size 5227
|
runs/Jun15_10-57-52_dfcef795325b/events.out.tfevents.1655290687.dfcef795325b.1148.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b904cfd70413c9fb49fef930b9673318ce9343c9284a78e0fd0e2952a6e381d
|
3 |
+
size 4005
|
runs/Jun15_11-03-13_dfcef795325b/1655291008.2963707/events.out.tfevents.1655291008.dfcef795325b.1345.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79fd9790f3adc8e53ad33ba8d94ea1217f9910f04c7718089b06a27ce6dab1f7
|
3 |
+
size 5227
|
runs/Jun15_11-03-13_dfcef795325b/events.out.tfevents.1655291008.dfcef795325b.1345.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:024bc8206745c1dd045f334de140a7863aba1907c484544d235e67fb451b5eca
|
3 |
+
size 4799
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
|
tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2c509a525eb51aebb33fb59c24ee923c1d4c1db23c3ae81fe05ccf354084f7b
|
3 |
+
size 17082758
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "xlm-roberta-large", "tokenizer_class": "XLMRobertaTokenizer"}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:558fc11324bc668c3f3c133007da090a6344533703fdc0c7f070a52f13ec34cc
|
3 |
+
size 3247
|