marcus2000 committed on
Commit
679a442
1 Parent(s): 41e15c7

Training in progress, step 1

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<EV>": 50265,
3
+ "<abs>": 50267,
4
+ "<t>": 50266
5
+ }
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "hyesunyun/update-summarization-bart-large-longformer",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "gelu",
6
+ "architectures": [
7
+ "LEDForConditionalGeneration"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "attention_window": [
11
+ 1024,
12
+ 1024,
13
+ 1024,
14
+ 1024,
15
+ 1024,
16
+ 1024,
17
+ 1024,
18
+ 1024,
19
+ 1024,
20
+ 1024,
21
+ 1024,
22
+ 1024
23
+ ],
24
+ "bos_token_id": 0,
25
+ "classif_dropout": 0.0,
26
+ "classifier_dropout": 0.0,
27
+ "d_model": 1024,
28
+ "decoder_attention_heads": 16,
29
+ "decoder_ffn_dim": 4096,
30
+ "decoder_layerdrop": 0.0,
31
+ "decoder_layers": 12,
32
+ "decoder_start_token_id": 2,
33
+ "dropout": 0.1,
34
+ "early_stopping": true,
35
+ "encoder_attention_heads": 16,
36
+ "encoder_ffn_dim": 4096,
37
+ "encoder_layerdrop": 0.0,
38
+ "encoder_layers": 12,
39
+ "eos_token_id": 2,
40
+ "id2label": {
41
+ "0": "LABEL_0",
42
+ "1": "LABEL_1",
43
+ "2": "LABEL_2"
44
+ },
45
+ "init_std": 0.02,
46
+ "is_encoder_decoder": true,
47
+ "label2id": {
48
+ "LABEL_0": 0,
49
+ "LABEL_1": 1,
50
+ "LABEL_2": 2
51
+ },
52
+ "length_penalty": 2.0,
53
+ "max_decoder_position_embeddings": 1024,
54
+ "max_encoder_position_embeddings": 16384,
55
+ "max_length": 512,
56
+ "min_length": 100,
57
+ "model_type": "led",
58
+ "no_repeat_ngram_size": 3,
59
+ "num_beams": 2,
60
+ "num_hidden_layers": 12,
61
+ "output_past": false,
62
+ "pad_token_id": 1,
63
+ "prefix": " ",
64
+ "torch_dtype": "float32",
65
+ "transformers_version": "4.29.2",
66
+ "use_cache": false,
67
+ "vocab_size": 50268
68
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa480c63e471ff5fa51ad9cdcdaa2607f9d3af6ea51208c7a9abdf534f414df
3
+ size 1839621037
runs/May25_04-52-49_1c65441e8d75/1684990380.414929/events.out.tfevents.1684990380.1c65441e8d75.6663.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b686d1d2e3ef14da0d5e384b5e66e30cb9736fae046889f0994e9b6a132142aa
3
+ size 6225
runs/May25_04-52-49_1c65441e8d75/1684990517.654749/events.out.tfevents.1684990517.1c65441e8d75.6663.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96fe43111de61197de7a044f74a407fb37965659cdb487706a96f8ac7d2cd0f1
3
+ size 6225
runs/May25_04-52-49_1c65441e8d75/events.out.tfevents.1684990380.1c65441e8d75.6663.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c5711c59b542e9e015003bdc854f5d18647e542cd2a675bba5f49ae92443a83
3
+ size 9810
runs/May25_04-55-31_1c65441e8d75/1684990539.6935906/events.out.tfevents.1684990539.1c65441e8d75.6663.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efb794b8d719abcbc699ade38abc3cff702c97d2770066f13dd2cf320f34e479
3
+ size 6225
runs/May25_04-55-31_1c65441e8d75/events.out.tfevents.1684990539.1c65441e8d75.6663.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae49314e1e736695612ec89f4bd8092e044d5a765e3e549e971b27a6e7557b7e
3
+ size 5101
runs/May25_04-56-15_1c65441e8d75/1684990582.9919426/events.out.tfevents.1684990582.1c65441e8d75.6663.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f74234ba192a6f79543a59eefe90715e07534ba9738e1aadd0ae400348babe9c
3
+ size 6225
runs/May25_04-56-15_1c65441e8d75/events.out.tfevents.1684990582.1c65441e8d75.6663.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d89032e107fb58bb27e6a60e03dac12063917a85ba23d01a14ccbb534f2976f
3
+ size 4947
runs/May25_04-56-38_1c65441e8d75/1684990605.992353/events.out.tfevents.1684990605.1c65441e8d75.6663.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d10919bb9556e65c776792783d9d0e4efa8dcc37bb2f1bc2f903ba5ff2b66e0
3
+ size 6225
runs/May25_04-56-38_1c65441e8d75/events.out.tfevents.1684990605.1c65441e8d75.6663.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d0eb3bb88dbc66cada69a1a502be371b309cab4f66668b12f9c63eaeb9d5600
3
+ size 4947
runs/May25_04-57-02_1c65441e8d75/1684990629.985542/events.out.tfevents.1684990629.1c65441e8d75.6663.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11c3bd841d082a2367be959a0a3c7c8d71d6a118c6fef204094d5e97c3ce7194
3
+ size 6225
runs/May25_04-57-02_1c65441e8d75/events.out.tfevents.1684990629.1c65441e8d75.6663.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01b4fd90861205b6ba3c34c864875d6fab2c94a105a3b5e2d0827e68cedaeda1
3
+ size 5616
special_tokens_map.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<EV>",
4
+ "<t>",
5
+ "<abs>"
6
+ ],
7
+ "bos_token": {
8
+ "content": "<s>",
9
+ "lstrip": false,
10
+ "normalized": true,
11
+ "rstrip": false,
12
+ "single_word": false
13
+ },
14
+ "cls_token": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "eos_token": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": false
27
+ },
28
+ "mask_token": {
29
+ "content": "<mask>",
30
+ "lstrip": true,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false
34
+ },
35
+ "pad_token": {
36
+ "content": "<pad>",
37
+ "lstrip": false,
38
+ "normalized": true,
39
+ "rstrip": false,
40
+ "single_word": false
41
+ },
42
+ "sep_token": {
43
+ "content": "</s>",
44
+ "lstrip": false,
45
+ "normalized": true,
46
+ "rstrip": false,
47
+ "single_word": false
48
+ },
49
+ "unk_token": {
50
+ "content": "<unk>",
51
+ "lstrip": false,
52
+ "normalized": true,
53
+ "rstrip": false,
54
+ "single_word": false
55
+ }
56
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "additional_special_tokens": [
4
+ "<EV>",
5
+ "<t>",
6
+ "<abs>"
7
+ ],
8
+ "bos_token": {
9
+ "__type": "AddedToken",
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "clean_up_tokenization_spaces": true,
17
+ "cls_token": {
18
+ "__type": "AddedToken",
19
+ "content": "<s>",
20
+ "lstrip": false,
21
+ "normalized": true,
22
+ "rstrip": false,
23
+ "single_word": false
24
+ },
25
+ "eos_token": {
26
+ "__type": "AddedToken",
27
+ "content": "</s>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ },
33
+ "errors": "replace",
34
+ "mask_token": {
35
+ "__type": "AddedToken",
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": true,
39
+ "rstrip": false,
40
+ "single_word": false
41
+ },
42
+ "model_max_length": 16384,
43
+ "pad_token": {
44
+ "__type": "AddedToken",
45
+ "content": "<pad>",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ },
51
+ "sep_token": {
52
+ "__type": "AddedToken",
53
+ "content": "</s>",
54
+ "lstrip": false,
55
+ "normalized": true,
56
+ "rstrip": false,
57
+ "single_word": false
58
+ },
59
+ "tokenizer_class": "LEDTokenizer",
60
+ "trim_offsets": true,
61
+ "unk_token": {
62
+ "__type": "AddedToken",
63
+ "content": "<unk>",
64
+ "lstrip": false,
65
+ "normalized": true,
66
+ "rstrip": false,
67
+ "single_word": false
68
+ }
69
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f87681d3221346557535e6e6bde3909756446cfb67b22a648ed393ec19b08fb3
3
+ size 4091
vocab.json ADDED
The diff for this file is too large to render. See raw diff