tm21cy committed on
Commit
04b0625
·
verified ·
1 Parent(s): 754360c

End of training

Browse files
README.md CHANGED
@@ -1,13 +1,28 @@
1
  ---
2
  license: apache-2.0
3
- base_model: albert-base-v2
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  model-index:
9
  - name: results
10
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,10 +30,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # results
17
 
18
- This model is a fine-tuned version of [albert-base-v2](https://huggingface.co/albert-base-v2) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.7940
21
- - Accuracy: 0.6556
22
 
23
  ## Model description
24
 
@@ -37,22 +52,21 @@ More information needed
37
  ### Training hyperparameters
38
 
39
  The following hyperparameters were used during training:
40
- - learning_rate: 7.45e-06
41
  - train_batch_size: 16
42
  - eval_batch_size: 16
43
  - seed: 42
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
- - num_epochs: 4
47
 
48
  ### Training results
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
- | No log | 1.0 | 179 | 0.6503 | 0.6492 |
53
- | No log | 2.0 | 358 | 0.7322 | 0.6565 |
54
- | 0.4518 | 3.0 | 537 | 0.7242 | 0.6649 |
55
- | 0.4518 | 4.0 | 716 | 0.7997 | 0.6586 |
56
 
57
 
58
  ### Framework versions
 
1
  ---
2
  license: apache-2.0
3
+ base_model: distilbert-base-uncased
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - emotion
8
  metrics:
9
  - accuracy
10
  model-index:
11
  - name: results
12
+ results:
13
+ - task:
14
+ name: Text Classification
15
+ type: text-classification
16
+ dataset:
17
+ name: emotion
18
+ type: emotion
19
+ config: split
20
+ split: validation
21
+ args: split
22
+ metrics:
23
+ - name: Accuracy
24
+ type: accuracy
25
+ value: 0.927
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
30
 
31
  # results
32
 
33
+ This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on the emotion dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.1888
36
+ - Accuracy: 0.927
37
 
38
  ## Model description
39
 
 
52
  ### Training hyperparameters
53
 
54
  The following hyperparameters were used during training:
55
+ - learning_rate: 5e-05
56
  - train_batch_size: 16
57
  - eval_batch_size: 16
58
  - seed: 42
59
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
  - lr_scheduler_type: linear
61
+ - num_epochs: 3
62
 
63
  ### Training results
64
 
65
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
66
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
67
+ | 0.2348 | 1.0 | 1000 | 0.2163 | 0.9255 |
68
+ | 0.1337 | 2.0 | 2000 | 0.1446 | 0.94 |
69
+ | 0.0886 | 3.0 | 3000 | 0.1541 | 0.9425 |
 
70
 
71
 
72
  ### Framework versions
config.json CHANGED
@@ -1,34 +1,41 @@
1
  {
2
- "_name_or_path": "albert-base-v2",
 
3
  "architectures": [
4
- "AlbertForSequenceClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0,
7
- "bos_token_id": 2,
8
- "classifier_dropout_prob": 0.1,
9
- "down_scale_factor": 1,
10
- "embedding_size": 128,
11
- "eos_token_id": 3,
12
- "gap_size": 0,
13
- "hidden_act": "gelu_new",
14
- "hidden_dropout_prob": 0,
15
- "hidden_size": 768,
 
 
16
  "initializer_range": 0.02,
17
- "inner_group_num": 1,
18
- "intermediate_size": 3072,
19
- "layer_norm_eps": 1e-12,
 
 
 
 
 
20
  "max_position_embeddings": 512,
21
- "model_type": "albert",
22
- "net_structure_type": 0,
23
- "num_attention_heads": 12,
24
- "num_hidden_groups": 1,
25
- "num_hidden_layers": 12,
26
- "num_memory_blocks": 0,
27
  "pad_token_id": 0,
28
- "position_embedding_type": "absolute",
29
  "problem_type": "single_label_classification",
 
 
 
 
30
  "torch_dtype": "float32",
31
  "transformers_version": "4.38.2",
32
- "type_vocab_size": 2,
33
- "vocab_size": 30000
34
  }
 
1
  {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
  "architectures": [
5
+ "DistilBertForSequenceClassification"
6
  ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "LABEL_0",
13
+ "1": "LABEL_1",
14
+ "2": "LABEL_2",
15
+ "3": "LABEL_3",
16
+ "4": "LABEL_4",
17
+ "5": "LABEL_5"
18
+ },
19
  "initializer_range": 0.02,
20
+ "label2id": {
21
+ "LABEL_0": 0,
22
+ "LABEL_1": 1,
23
+ "LABEL_2": 2,
24
+ "LABEL_3": 3,
25
+ "LABEL_4": 4,
26
+ "LABEL_5": 5
27
+ },
28
  "max_position_embeddings": 512,
29
+ "model_type": "distilbert",
30
+ "n_heads": 12,
31
+ "n_layers": 6,
 
 
 
32
  "pad_token_id": 0,
 
33
  "problem_type": "single_label_classification",
34
+ "qa_dropout": 0.1,
35
+ "seq_classif_dropout": 0.2,
36
+ "sinusoidal_pos_embds": false,
37
+ "tie_weights_": true,
38
  "torch_dtype": "float32",
39
  "transformers_version": "4.38.2",
40
+ "vocab_size": 30522
 
41
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55c21def950937d603e0c5209b8f4919e6ccd850fa82bf7502bb5b87db480922
3
- size 46743912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d54e4c4738766f78da46d6cd0dded2a4577f0ccaf3b33bb75a896fb44324668
3
+ size 267844872
runs/Mar11_04-37-43_f6b7ca2de819/events.out.tfevents.1710131875.f6b7ca2de819.11996.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:824c47e6c92aac32a69795f7ac30153a45ff177f942c1ac433199e3864d41486
3
- size 6966
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:036ad2794043d948b8f683a723bd9c0d565d54b8d38606e460db73b2fa313633
3
+ size 7643
runs/Mar11_04-37-43_f6b7ca2de819/events.out.tfevents.1710132833.f6b7ca2de819.11996.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04341eea254b3869f528b833a9e23df03a14efc96c89330f3a7ae95442ebff6d
3
+ size 411
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a89d981b6c77c4b865598567ba8078b5c04cddc89be6ec115b4c0d666b32c9c1
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75b232ae5b88203fffec359819dd835494a78f15470739cd8dade60135b72c99
3
  size 4920