ThuyNT03 committed on
Commit
8412d30
1 Parent(s): 5dbfba8

Training completed!

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: vinai/phobert-base-v2
3
  tags:
4
  - generated_from_trainer
5
  metrics:
@@ -15,9 +15,9 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # PhoBERT-cls-detail-in-Non_OCR
17
 
18
- This model is a fine-tuned version of [vinai/phobert-base-v2](https://huggingface.co/vinai/phobert-base-v2) on the None dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3171
21
  - Accuracy: 0.95
22
  - F1: 0.9359
23
 
@@ -44,25 +44,24 @@ The following hyperparameters were used during training:
44
  - seed: 42
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
- - num_epochs: 8
48
 
49
  ### Training results
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 |
52
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|
53
- | 1.5232 | 1.0 | 25 | 1.1976 | 0.79 | 0.7209 |
54
- | 1.0392 | 2.0 | 50 | 0.7550 | 0.91 | 0.8830 |
55
- | 0.6986 | 3.0 | 75 | 0.5119 | 0.92 | 0.8928 |
56
- | 0.5144 | 4.0 | 100 | 0.4181 | 0.92 | 0.8928 |
57
- | 0.4265 | 5.0 | 125 | 0.3602 | 0.95 | 0.9359 |
58
- | 0.3618 | 6.0 | 150 | 0.3394 | 0.95 | 0.9359 |
59
- | 0.3196 | 7.0 | 175 | 0.3218 | 0.95 | 0.9359 |
60
- | 0.2982 | 8.0 | 200 | 0.3171 | 0.95 | 0.9359 |
61
 
62
 
63
  ### Framework versions
64
 
65
- - Transformers 4.33.3
66
  - Pytorch 2.0.1+cu118
67
  - Datasets 2.14.5
68
- - Tokenizers 0.13.3
 
1
  ---
2
+ base_model: vinai/phobert-base
3
  tags:
4
  - generated_from_trainer
5
  metrics:
 
15
 
16
  # PhoBERT-cls-detail-in-Non_OCR
17
 
18
+ This model is a fine-tuned version of [vinai/phobert-base](https://huggingface.co/vinai/phobert-base) on an unspecified dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.2965
21
  - Accuracy: 0.95
22
  - F1: 0.9359
23
 
 
44
  - seed: 42
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
+ - num_epochs: 7
48
 
49
  ### Training results
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 |
52
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|
53
+ | 1.5312 | 1.0 | 25 | 1.2681 | 0.55 | 0.4060 |
54
+ | 1.1478 | 2.0 | 50 | 0.8709 | 0.82 | 0.7465 |
55
+ | 0.7779 | 3.0 | 75 | 0.5259 | 0.92 | 0.8928 |
56
+ | 0.528 | 4.0 | 100 | 0.3918 | 0.92 | 0.8928 |
57
+ | 0.4236 | 5.0 | 125 | 0.3363 | 0.94 | 0.9254 |
58
+ | 0.3641 | 6.0 | 150 | 0.3035 | 0.95 | 0.9359 |
59
+ | 0.3356 | 7.0 | 175 | 0.2965 | 0.95 | 0.9359 |
 
60
 
61
 
62
  ### Framework versions
63
 
64
+ - Transformers 4.34.0
65
  - Pytorch 2.0.1+cu118
66
  - Datasets 2.14.5
67
+ - Tokenizers 0.14.1
added_tokens.json CHANGED
@@ -1,3 +1,7 @@
1
  {
2
- "<mask>": 64000
 
 
 
 
3
  }
 
1
  {
2
+ "</s>": 2,
3
+ "<mask>": 64000,
4
+ "<pad>": 1,
5
+ "<s>": 0,
6
+ "<unk>": 3
7
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "vinai/phobert-base-v2",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
@@ -7,6 +7,7 @@
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "eos_token_id": 2,
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
@@ -38,7 +39,7 @@
38
  "problem_type": "single_label_classification",
39
  "tokenizer_class": "PhobertTokenizer",
40
  "torch_dtype": "float32",
41
- "transformers_version": "4.33.3",
42
  "type_vocab_size": 1,
43
  "use_cache": true,
44
  "vocab_size": 64001
 
1
  {
2
+ "_name_or_path": "vinai/phobert-base",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
 
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
  "hidden_act": "gelu",
12
  "hidden_dropout_prob": 0.1,
13
  "hidden_size": 768,
 
39
  "problem_type": "single_label_classification",
40
  "tokenizer_class": "PhobertTokenizer",
41
  "torch_dtype": "float32",
42
+ "transformers_version": "4.34.0",
43
  "type_vocab_size": 1,
44
  "use_cache": true,
45
  "vocab_size": 64001
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf04b61da97934148142f76be9fc1dfc13a8f705c4f1fefca4614ef4ed0c8594
3
  size 540080497
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de5997667b22f35807f1161d74db16beeed56c23089220f192420e7fcf5a28f5
3
  size 540080497
tokenizer_config.json CHANGED
@@ -1,4 +1,47 @@
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token": "<s>",
3
  "clean_up_tokenization_spaces": true,
4
  "cls_token": "<s>",
@@ -8,5 +51,6 @@
8
  "pad_token": "<pad>",
9
  "sep_token": "</s>",
10
  "tokenizer_class": "PhobertTokenizer",
 
11
  "unk_token": "<unk>"
12
  }
 
1
  {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "64000": {
36
+ "content": "<mask>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "additional_special_tokens": [],
45
  "bos_token": "<s>",
46
  "clean_up_tokenization_spaces": true,
47
  "cls_token": "<s>",
 
51
  "pad_token": "<pad>",
52
  "sep_token": "</s>",
53
  "tokenizer_class": "PhobertTokenizer",
54
+ "tokenizer_file": "/root/.cache/huggingface/hub/models--vinai--phobert-large/snapshots/9ce4eafcd8e601d798295b17c75c5f5f1b1509b9/tokenizer.json",
55
  "unk_token": "<unk>"
56
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92cd65c70df121f6e89d516f162c48afdb626e0109cbfd5d3595e5fa6bd261b6
3
- size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6af8aa3f9b6974a88282861a87312175519579d399c4620e4914bc3a1801f07
3
+ size 4091