jsl5710 committed on
Commit
bab5ad9
1 Parent(s): 728ce8b

jslai//content/sample_data/best_models//MBERT_uncased_CrossEntropyLoss_lora

Browse files
README.md CHANGED
@@ -21,12 +21,12 @@ should probably proofread and complete it, then remove this comment. -->
21
 
22
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on the None dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.6661
25
- - Accuracy: 0.724
26
- - F1: 0.8399
27
- - Precision: 0.724
28
- - Recall: 1.0
29
- - Roc Auc: 0.5
30
 
31
  ## Model description
32
 
@@ -61,9 +61,9 @@ The following hyperparameters were used during training:
61
 
62
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
63
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
64
- | No log | 0.992 | 31 | 0.6806 | 0.673 | 0.7940 | 0.7300 | 0.8702 | 0.5130 |
65
- | No log | 1.984 | 62 | 0.6696 | 0.724 | 0.8399 | 0.724 | 1.0 | 0.5 |
66
- | No log | 2.976 | 93 | 0.6661 | 0.724 | 0.8399 | 0.724 | 1.0 | 0.5 |
67
 
68
 
69
  ### Framework versions
 
21
 
22
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on the None dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.6924
25
+ - Accuracy: 0.518
26
+ - F1: 0.6730
27
+ - Precision: 0.6613
28
+ - Recall: 0.6851
29
+ - Roc Auc: 0.3824
30
 
31
  ## Model description
32
 
 
61
 
62
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
63
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
64
+ | No log | 0.992 | 31 | 0.7081 | 0.347 | 0.4287 | 0.5847 | 0.3384 | 0.3540 |
65
+ | No log | 1.984 | 62 | 0.6961 | 0.479 | 0.6354 | 0.6440 | 0.6271 | 0.3588 |
66
+ | No log | 2.976 | 93 | 0.6924 | 0.518 | 0.6730 | 0.6613 | 0.6851 | 0.3824 |
67
 
68
 
69
  ### Framework versions
adapter_config.json CHANGED
@@ -3,6 +3,7 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google-bert/bert-base-multilingual-uncased",
5
  "bias": "none",
 
6
  "exclude_modules": null,
7
  "fan_in_fan_out": false,
8
  "inference_mode": true,
@@ -25,10 +26,22 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "attention.output.dense",
 
 
 
 
 
29
  "query",
 
 
 
 
30
  "key",
31
- "value"
 
 
 
32
  ],
33
  "task_type": "SEQ_CLS",
34
  "use_dora": false,
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google-bert/bert-base-multilingual-uncased",
5
  "bias": "none",
6
+ "eva_config": null,
7
  "exclude_modules": null,
8
  "fan_in_fan_out": false,
9
  "inference_mode": true,
 
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
+ "2.output.dense",
30
+ "10.output.dense",
31
+ "7.output.dense",
32
+ "0.output.dense",
33
+ "11.output.dense",
34
+ "6.output.dense",
35
  "query",
36
+ "intermediate.dense",
37
+ "1.output.dense",
38
+ "3.output.dense",
39
+ "8.output.dense",
40
  "key",
41
+ "4.output.dense",
42
+ "value",
43
+ "9.output.dense",
44
+ "5.output.dense"
45
  ],
46
  "task_type": "SEQ_CLS",
47
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60574d14a542f2baac667447c36c40f22f0c071753f78d4bd8b3dce2afd37236
3
- size 4738488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbf2f8bd5fd0b9ee7d80ff96a52e17294e9a5993f0c4ff96bc133dee7c672233
3
+ size 9460216
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 512
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 0,
16
- "pad_type_id": 0,
17
- "pad_token": "[PAD]"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a012e14337c6de9ce53cd647f95a4d1a5be53eb769d49ae62fc6681f71ebd6c
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82b2fd2247497f5b190738596ccaf24d58f63e59709eca93de454d50b8b80ef9
3
  size 5304