tushifire committed on
Commit
3d5dca7
1 Parent(s): e7670a6

Training complete

Browse files
README.md ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: dslim/distilbert-NER
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - precision
8
+ - recall
9
+ - f1
10
+ - accuracy
11
+ model-index:
12
+ - name: distilbert-finetuned-ner
13
+ results: []
14
+ ---
15
+
16
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
+ should probably proofread and complete it, then remove this comment. -->
18
+
19
+ # distilbert-finetuned-ner
20
+
21
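+ This model is a fine-tuned version of [dslim/distilbert-NER](https://huggingface.co/dslim/distilbert-NER) on a dataset that was not recorded by the Trainer (the label set in `config.json` — Actor, Director, Genre, Plot, Award, etc. — suggests movie-domain NER data).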
22
+ It achieves the following results on the evaluation set:
23
+ - Loss: 0.4109
24
+ - Precision: 0.6952
25
+ - Recall: 0.7549
26
+ - F1: 0.7238
27
+ - Accuracy: 0.8724
28
+
29
+ ## Model description
30
+
31
+ More information needed
32
+
33
+ ## Intended uses & limitations
34
+
35
+ More information needed
36
+
37
+ ## Training and evaluation data
38
+
39
+ More information needed
40
+
41
+ ## Training procedure
42
+
43
+ ### Training hyperparameters
44
+
45
+ The following hyperparameters were used during training:
46
+ - learning_rate: 1e-06
47
+ - train_batch_size: 8
48
+ - eval_batch_size: 8
49
+ - seed: 42
50
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
+ - lr_scheduler_type: linear
52
+ - num_epochs: 20
53
+
54
+ ### Training results
55
+
56
+ | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
+ |:-------------:|:-----:|:-----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
+ | 1.647 | 1.0 | 977 | 0.8265 | 0.4918 | 0.5741 | 0.5298 | 0.7793 |
59
+ | 0.7697 | 2.0 | 1954 | 0.6350 | 0.5801 | 0.6567 | 0.6160 | 0.8194 |
60
+ | 0.6089 | 3.0 | 2931 | 0.5591 | 0.6138 | 0.6857 | 0.6478 | 0.8352 |
61
+ | 0.534 | 4.0 | 3908 | 0.5163 | 0.6296 | 0.6955 | 0.6609 | 0.8439 |
62
+ | 0.4911 | 5.0 | 4885 | 0.4885 | 0.6436 | 0.7075 | 0.6740 | 0.8498 |
63
+ | 0.4545 | 6.0 | 5862 | 0.4683 | 0.6526 | 0.7165 | 0.6830 | 0.8557 |
64
+ | 0.4379 | 7.0 | 6839 | 0.4534 | 0.6600 | 0.7231 | 0.6901 | 0.8592 |
65
+ | 0.4124 | 8.0 | 7816 | 0.4441 | 0.6713 | 0.7274 | 0.6982 | 0.8625 |
66
+ | 0.403 | 9.0 | 8793 | 0.4345 | 0.6746 | 0.7359 | 0.7039 | 0.8658 |
67
+ | 0.394 | 10.0 | 9770 | 0.4324 | 0.6835 | 0.7445 | 0.7127 | 0.8667 |
68
+ | 0.3782 | 11.0 | 10747 | 0.4256 | 0.6820 | 0.7465 | 0.7128 | 0.8678 |
69
+ | 0.3706 | 12.0 | 11724 | 0.4213 | 0.6873 | 0.7460 | 0.7155 | 0.8691 |
70
+ | 0.3712 | 13.0 | 12701 | 0.4197 | 0.6873 | 0.7518 | 0.7181 | 0.8703 |
71
+ | 0.3626 | 14.0 | 13678 | 0.4163 | 0.6882 | 0.7523 | 0.7188 | 0.8713 |
72
+ | 0.351 | 15.0 | 14655 | 0.4142 | 0.6905 | 0.7528 | 0.7203 | 0.8717 |
73
+ | 0.3528 | 16.0 | 15632 | 0.4142 | 0.6932 | 0.7538 | 0.7222 | 0.8718 |
74
+ | 0.3523 | 17.0 | 16609 | 0.4123 | 0.6949 | 0.7533 | 0.7229 | 0.8722 |
75
+ | 0.3464 | 18.0 | 17586 | 0.4107 | 0.6936 | 0.7538 | 0.7224 | 0.8727 |
76
+ | 0.342 | 19.0 | 18563 | 0.4115 | 0.6954 | 0.7560 | 0.7244 | 0.8726 |
77
+ | 0.3496 | 20.0 | 19540 | 0.4109 | 0.6952 | 0.7549 | 0.7238 | 0.8724 |
78
+
79
+
80
+ ### Framework versions
81
+
82
+ - Transformers 4.41.1
83
+ - PyTorch 2.3.0+cu121
84
+ - Datasets 2.19.1
85
+ - Tokenizers 0.19.1
config.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "dslim/distilbert-NER",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForTokenClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "B-Actor",
13
+ "1": "I-Actor",
14
+ "2": "O",
15
+ "3": "B-Plot",
16
+ "4": "I-Plot",
17
+ "5": "B-Opinion",
18
+ "6": "I-Opinion",
19
+ "7": "B-Award",
20
+ "8": "I-Award",
21
+ "9": "B-Year",
22
+ "10": "B-Genre",
23
+ "11": "B-Origin",
24
+ "12": "I-Origin",
25
+ "13": "B-Director",
26
+ "14": "I-Director",
27
+ "15": "I-Genre",
28
+ "16": "I-Year",
29
+ "17": "B-Soundtrack",
30
+ "18": "I-Soundtrack",
31
+ "19": "B-Relationship",
32
+ "20": "I-Relationship",
33
+ "21": "B-Character_Name",
34
+ "22": "I-Character_Name",
35
+ "23": "B-Quote",
36
+ "24": "I-Quote"
37
+ },
38
+ "initializer_range": 0.02,
39
+ "label2id": {
40
+ "B-Actor": 0,
41
+ "B-Award": 7,
42
+ "B-Character_Name": 21,
43
+ "B-Director": 13,
44
+ "B-Genre": 10,
45
+ "B-Opinion": 5,
46
+ "B-Origin": 11,
47
+ "B-Plot": 3,
48
+ "B-Quote": 23,
49
+ "B-Relationship": 19,
50
+ "B-Soundtrack": 17,
51
+ "B-Year": 9,
52
+ "I-Actor": 1,
53
+ "I-Award": 8,
54
+ "I-Character_Name": 22,
55
+ "I-Director": 14,
56
+ "I-Genre": 15,
57
+ "I-Opinion": 6,
58
+ "I-Origin": 12,
59
+ "I-Plot": 4,
60
+ "I-Quote": 24,
61
+ "I-Relationship": 20,
62
+ "I-Soundtrack": 18,
63
+ "I-Year": 16,
64
+ "O": 2
65
+ },
66
+ "max_position_embeddings": 512,
67
+ "model_type": "distilbert",
68
+ "n_heads": 12,
69
+ "n_layers": 6,
70
+ "output_past": true,
71
+ "pad_token_id": 0,
72
+ "qa_dropout": 0.1,
73
+ "seq_classif_dropout": 0.2,
74
+ "sinusoidal_pos_embds": false,
75
+ "tie_weights_": true,
76
+ "torch_dtype": "float32",
77
+ "transformers_version": "4.41.1",
78
+ "vocab_size": 28996
79
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b67822b905e1a2549036addb2f40af083414c7cf2e3d448fba7864dbceb61bd
3
+ size 260852884
runs/May29_00-40-55_deda405e21c0/events.out.tfevents.1716943258.deda405e21c0.512.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f9c3a64b68d5a298eac7a40c9d011a550b49ca6aafc9e274d2c19c7658f634
3
+ size 23970
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": false,
47
+ "mask_token": "[MASK]",
48
+ "max_length": 512,
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "stride": 0,
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "DistilBertTokenizer",
56
+ "truncation_side": "right",
57
+ "truncation_strategy": "longest_first",
58
+ "unk_token": "[UNK]"
59
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b9654a2c6d1063cc7ca3416469378cfa04fddd59eb06a3ae4f2fcbfcc6e7231
3
+ size 5112
vocab.txt ADDED
The diff for this file is too large to render. See raw diff