marcus2000
committed on
Commit
•
679a442
1
Parent(s):
41e15c7
Training in progress, step 1
Browse files
- .gitignore +1 -0
- added_tokens.json +5 -0
- config.json +68 -0
- merges.txt +0 -0
- pytorch_model.bin +3 -0
- runs/May25_04-52-49_1c65441e8d75/1684990380.414929/events.out.tfevents.1684990380.1c65441e8d75.6663.1 +3 -0
- runs/May25_04-52-49_1c65441e8d75/1684990517.654749/events.out.tfevents.1684990517.1c65441e8d75.6663.2 +3 -0
- runs/May25_04-52-49_1c65441e8d75/events.out.tfevents.1684990380.1c65441e8d75.6663.0 +3 -0
- runs/May25_04-55-31_1c65441e8d75/1684990539.6935906/events.out.tfevents.1684990539.1c65441e8d75.6663.4 +3 -0
- runs/May25_04-55-31_1c65441e8d75/events.out.tfevents.1684990539.1c65441e8d75.6663.3 +3 -0
- runs/May25_04-56-15_1c65441e8d75/1684990582.9919426/events.out.tfevents.1684990582.1c65441e8d75.6663.6 +3 -0
- runs/May25_04-56-15_1c65441e8d75/events.out.tfevents.1684990582.1c65441e8d75.6663.5 +3 -0
- runs/May25_04-56-38_1c65441e8d75/1684990605.992353/events.out.tfevents.1684990605.1c65441e8d75.6663.8 +3 -0
- runs/May25_04-56-38_1c65441e8d75/events.out.tfevents.1684990605.1c65441e8d75.6663.7 +3 -0
- runs/May25_04-57-02_1c65441e8d75/1684990629.985542/events.out.tfevents.1684990629.1c65441e8d75.6663.10 +3 -0
- runs/May25_04-57-02_1c65441e8d75/events.out.tfevents.1684990629.1c65441e8d75.6663.9 +3 -0
- special_tokens_map.json +56 -0
- tokenizer.json +0 -0
- tokenizer_config.json +69 -0
- training_args.bin +3 -0
- vocab.json +0 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<EV>": 50265,
|
3 |
+
"<abs>": 50267,
|
4 |
+
"<t>": 50266
|
5 |
+
}
|
config.json
ADDED
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "hyesunyun/update-summarization-bart-large-longformer",
|
3 |
+
"_num_labels": 3,
|
4 |
+
"activation_dropout": 0.0,
|
5 |
+
"activation_function": "gelu",
|
6 |
+
"architectures": [
|
7 |
+
"LEDForConditionalGeneration"
|
8 |
+
],
|
9 |
+
"attention_dropout": 0.0,
|
10 |
+
"attention_window": [
|
11 |
+
1024,
|
12 |
+
1024,
|
13 |
+
1024,
|
14 |
+
1024,
|
15 |
+
1024,
|
16 |
+
1024,
|
17 |
+
1024,
|
18 |
+
1024,
|
19 |
+
1024,
|
20 |
+
1024,
|
21 |
+
1024,
|
22 |
+
1024
|
23 |
+
],
|
24 |
+
"bos_token_id": 0,
|
25 |
+
"classif_dropout": 0.0,
|
26 |
+
"classifier_dropout": 0.0,
|
27 |
+
"d_model": 1024,
|
28 |
+
"decoder_attention_heads": 16,
|
29 |
+
"decoder_ffn_dim": 4096,
|
30 |
+
"decoder_layerdrop": 0.0,
|
31 |
+
"decoder_layers": 12,
|
32 |
+
"decoder_start_token_id": 2,
|
33 |
+
"dropout": 0.1,
|
34 |
+
"early_stopping": true,
|
35 |
+
"encoder_attention_heads": 16,
|
36 |
+
"encoder_ffn_dim": 4096,
|
37 |
+
"encoder_layerdrop": 0.0,
|
38 |
+
"encoder_layers": 12,
|
39 |
+
"eos_token_id": 2,
|
40 |
+
"id2label": {
|
41 |
+
"0": "LABEL_0",
|
42 |
+
"1": "LABEL_1",
|
43 |
+
"2": "LABEL_2"
|
44 |
+
},
|
45 |
+
"init_std": 0.02,
|
46 |
+
"is_encoder_decoder": true,
|
47 |
+
"label2id": {
|
48 |
+
"LABEL_0": 0,
|
49 |
+
"LABEL_1": 1,
|
50 |
+
"LABEL_2": 2
|
51 |
+
},
|
52 |
+
"length_penalty": 2.0,
|
53 |
+
"max_decoder_position_embeddings": 1024,
|
54 |
+
"max_encoder_position_embeddings": 16384,
|
55 |
+
"max_length": 512,
|
56 |
+
"min_length": 100,
|
57 |
+
"model_type": "led",
|
58 |
+
"no_repeat_ngram_size": 3,
|
59 |
+
"num_beams": 2,
|
60 |
+
"num_hidden_layers": 12,
|
61 |
+
"output_past": false,
|
62 |
+
"pad_token_id": 1,
|
63 |
+
"prefix": " ",
|
64 |
+
"torch_dtype": "float32",
|
65 |
+
"transformers_version": "4.29.2",
|
66 |
+
"use_cache": false,
|
67 |
+
"vocab_size": 50268
|
68 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aa480c63e471ff5fa51ad9cdcdaa2607f9d3af6ea51208c7a9abdf534f414df
|
3 |
+
size 1839621037
|
runs/May25_04-52-49_1c65441e8d75/1684990380.414929/events.out.tfevents.1684990380.1c65441e8d75.6663.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b686d1d2e3ef14da0d5e384b5e66e30cb9736fae046889f0994e9b6a132142aa
|
3 |
+
size 6225
|
runs/May25_04-52-49_1c65441e8d75/1684990517.654749/events.out.tfevents.1684990517.1c65441e8d75.6663.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96fe43111de61197de7a044f74a407fb37965659cdb487706a96f8ac7d2cd0f1
|
3 |
+
size 6225
|
runs/May25_04-52-49_1c65441e8d75/events.out.tfevents.1684990380.1c65441e8d75.6663.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c5711c59b542e9e015003bdc854f5d18647e542cd2a675bba5f49ae92443a83
|
3 |
+
size 9810
|
runs/May25_04-55-31_1c65441e8d75/1684990539.6935906/events.out.tfevents.1684990539.1c65441e8d75.6663.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb794b8d719abcbc699ade38abc3cff702c97d2770066f13dd2cf320f34e479
|
3 |
+
size 6225
|
runs/May25_04-55-31_1c65441e8d75/events.out.tfevents.1684990539.1c65441e8d75.6663.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae49314e1e736695612ec89f4bd8092e044d5a765e3e549e971b27a6e7557b7e
|
3 |
+
size 5101
|
runs/May25_04-56-15_1c65441e8d75/1684990582.9919426/events.out.tfevents.1684990582.1c65441e8d75.6663.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f74234ba192a6f79543a59eefe90715e07534ba9738e1aadd0ae400348babe9c
|
3 |
+
size 6225
|
runs/May25_04-56-15_1c65441e8d75/events.out.tfevents.1684990582.1c65441e8d75.6663.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d89032e107fb58bb27e6a60e03dac12063917a85ba23d01a14ccbb534f2976f
|
3 |
+
size 4947
|
runs/May25_04-56-38_1c65441e8d75/1684990605.992353/events.out.tfevents.1684990605.1c65441e8d75.6663.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d10919bb9556e65c776792783d9d0e4efa8dcc37bb2f1bc2f903ba5ff2b66e0
|
3 |
+
size 6225
|
runs/May25_04-56-38_1c65441e8d75/events.out.tfevents.1684990605.1c65441e8d75.6663.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d0eb3bb88dbc66cada69a1a502be371b309cab4f66668b12f9c63eaeb9d5600
|
3 |
+
size 4947
|
runs/May25_04-57-02_1c65441e8d75/1684990629.985542/events.out.tfevents.1684990629.1c65441e8d75.6663.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c3bd841d082a2367be959a0a3c7c8d71d6a118c6fef204094d5e97c3ce7194
|
3 |
+
size 6225
|
runs/May25_04-57-02_1c65441e8d75/events.out.tfevents.1684990629.1c65441e8d75.6663.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01b4fd90861205b6ba3c34c864875d6fab2c94a105a3b5e2d0827e68cedaeda1
|
3 |
+
size 5616
|
special_tokens_map.json
ADDED
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
"<EV>",
|
4 |
+
"<t>",
|
5 |
+
"<abs>"
|
6 |
+
],
|
7 |
+
"bos_token": {
|
8 |
+
"content": "<s>",
|
9 |
+
"lstrip": false,
|
10 |
+
"normalized": true,
|
11 |
+
"rstrip": false,
|
12 |
+
"single_word": false
|
13 |
+
},
|
14 |
+
"cls_token": {
|
15 |
+
"content": "<s>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": true,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false
|
20 |
+
},
|
21 |
+
"eos_token": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": true,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false
|
27 |
+
},
|
28 |
+
"mask_token": {
|
29 |
+
"content": "<mask>",
|
30 |
+
"lstrip": true,
|
31 |
+
"normalized": true,
|
32 |
+
"rstrip": false,
|
33 |
+
"single_word": false
|
34 |
+
},
|
35 |
+
"pad_token": {
|
36 |
+
"content": "<pad>",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": true,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false
|
41 |
+
},
|
42 |
+
"sep_token": {
|
43 |
+
"content": "</s>",
|
44 |
+
"lstrip": false,
|
45 |
+
"normalized": true,
|
46 |
+
"rstrip": false,
|
47 |
+
"single_word": false
|
48 |
+
},
|
49 |
+
"unk_token": {
|
50 |
+
"content": "<unk>",
|
51 |
+
"lstrip": false,
|
52 |
+
"normalized": true,
|
53 |
+
"rstrip": false,
|
54 |
+
"single_word": false
|
55 |
+
}
|
56 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,69 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"additional_special_tokens": [
|
4 |
+
"<EV>",
|
5 |
+
"<t>",
|
6 |
+
"<abs>"
|
7 |
+
],
|
8 |
+
"bos_token": {
|
9 |
+
"__type": "AddedToken",
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"clean_up_tokenization_spaces": true,
|
17 |
+
"cls_token": {
|
18 |
+
"__type": "AddedToken",
|
19 |
+
"content": "<s>",
|
20 |
+
"lstrip": false,
|
21 |
+
"normalized": true,
|
22 |
+
"rstrip": false,
|
23 |
+
"single_word": false
|
24 |
+
},
|
25 |
+
"eos_token": {
|
26 |
+
"__type": "AddedToken",
|
27 |
+
"content": "</s>",
|
28 |
+
"lstrip": false,
|
29 |
+
"normalized": true,
|
30 |
+
"rstrip": false,
|
31 |
+
"single_word": false
|
32 |
+
},
|
33 |
+
"errors": "replace",
|
34 |
+
"mask_token": {
|
35 |
+
"__type": "AddedToken",
|
36 |
+
"content": "<mask>",
|
37 |
+
"lstrip": true,
|
38 |
+
"normalized": true,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false
|
41 |
+
},
|
42 |
+
"model_max_length": 16384,
|
43 |
+
"pad_token": {
|
44 |
+
"__type": "AddedToken",
|
45 |
+
"content": "<pad>",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": true,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
},
|
51 |
+
"sep_token": {
|
52 |
+
"__type": "AddedToken",
|
53 |
+
"content": "</s>",
|
54 |
+
"lstrip": false,
|
55 |
+
"normalized": true,
|
56 |
+
"rstrip": false,
|
57 |
+
"single_word": false
|
58 |
+
},
|
59 |
+
"tokenizer_class": "LEDTokenizer",
|
60 |
+
"trim_offsets": true,
|
61 |
+
"unk_token": {
|
62 |
+
"__type": "AddedToken",
|
63 |
+
"content": "<unk>",
|
64 |
+
"lstrip": false,
|
65 |
+
"normalized": true,
|
66 |
+
"rstrip": false,
|
67 |
+
"single_word": false
|
68 |
+
}
|
69 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f87681d3221346557535e6e6bde3909756446cfb67b22a648ed393ec19b08fb3
|
3 |
+
size 4091
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|