end of training 3 epochs
Browse files- last-checkpoint/config.json +0 -38
- last-checkpoint/optimizer.pt +0 -3
- last-checkpoint/pytorch_model.bin +0 -3
- last-checkpoint/rng_state.pth +0 -3
- last-checkpoint/special_tokens_map.json +0 -1
- last-checkpoint/tokenizer.json +0 -0
- last-checkpoint/tokenizer_config.json +0 -1
- last-checkpoint/trainer_state.json +0 -33
- last-checkpoint/vocab.txt +0 -0
- pytorch_model.bin +1 -1
- last-checkpoint/scheduler.pt → runs/May20_16-45-11_1556878e54c8/1653069099.1539524/events.out.tfevents.1653069099.1556878e54c8.71.3 +2 -2
- runs/May20_16-45-11_1556878e54c8/events.out.tfevents.1653065256.1556878e54c8.71.0 +2 -2
- last-checkpoint/training_args.bin → runs/May20_16-45-11_1556878e54c8/events.out.tfevents.1653069099.1556878e54c8.71.2 +2 -2
last-checkpoint/config.json
DELETED
@@ -1,38 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"_name_or_path": "distilbert-base-cased",
|
3 |
-
"activation": "gelu",
|
4 |
-
"architectures": [
|
5 |
-
"DistilBertForSequenceClassification"
|
6 |
-
],
|
7 |
-
"attention_dropout": 0.1,
|
8 |
-
"dim": 768,
|
9 |
-
"dropout": 0.1,
|
10 |
-
"hidden_dim": 3072,
|
11 |
-
"id2label": {
|
12 |
-
"0": "anger",
|
13 |
-
"1": "joy",
|
14 |
-
"2": "optimism",
|
15 |
-
"3": "sadness"
|
16 |
-
},
|
17 |
-
"initializer_range": 0.02,
|
18 |
-
"label2id": {
|
19 |
-
"anger": 0,
|
20 |
-
"joy": 1,
|
21 |
-
"optimism": 2,
|
22 |
-
"sadness": 3
|
23 |
-
},
|
24 |
-
"max_position_embeddings": 512,
|
25 |
-
"model_type": "distilbert",
|
26 |
-
"n_heads": 12,
|
27 |
-
"n_layers": 6,
|
28 |
-
"output_past": true,
|
29 |
-
"pad_token_id": 0,
|
30 |
-
"problem_type": "single_label_classification",
|
31 |
-
"qa_dropout": 0.1,
|
32 |
-
"seq_classif_dropout": 0.2,
|
33 |
-
"sinusoidal_pos_embds": false,
|
34 |
-
"tie_weights_": true,
|
35 |
-
"torch_dtype": "float32",
|
36 |
-
"transformers_version": "4.19.2",
|
37 |
-
"vocab_size": 28996
|
38 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
last-checkpoint/optimizer.pt
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:c73959244780ed2bba8e269a5f5733ee0285e79e761a18e2426204da083e85e7
|
3 |
-
size 526333665
|
|
|
|
|
|
|
|
last-checkpoint/pytorch_model.bin
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:dcd4a646170bae452fd479376c51512baf9048ba690f562eced96391ff6f7489
|
3 |
-
size 263171185
|
|
|
|
|
|
|
|
last-checkpoint/rng_state.pth
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:28a456a7185f5f7b097c752c4b588206eb05b773927f71481138433c212d65fd
|
3 |
-
size 13547
|
|
|
|
|
|
|
|
last-checkpoint/special_tokens_map.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
|
|
|
|
last-checkpoint/tokenizer.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
last-checkpoint/tokenizer_config.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilbert-base-cased", "tokenizer_class": "DistilBertTokenizer"}
|
|
|
|
last-checkpoint/trainer_state.json
DELETED
@@ -1,33 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"best_metric": 0.6013594903216822,
|
3 |
-
"best_model_checkpoint": "bert-emotion/checkpoint-815",
|
4 |
-
"epoch": 1.0,
|
5 |
-
"global_step": 815,
|
6 |
-
"is_hyper_param_search": false,
|
7 |
-
"is_local_process_zero": true,
|
8 |
-
"is_world_process_zero": true,
|
9 |
-
"log_history": [
|
10 |
-
{
|
11 |
-
"epoch": 1.0,
|
12 |
-
"learning_rate": 3.3333333333333335e-05,
|
13 |
-
"loss": 0.8385,
|
14 |
-
"step": 815
|
15 |
-
},
|
16 |
-
{
|
17 |
-
"epoch": 1.0,
|
18 |
-
"eval_fscore": 0.6013594903216822,
|
19 |
-
"eval_loss": 0.8365974426269531,
|
20 |
-
"eval_precision": 0.7865216201423099,
|
21 |
-
"eval_recall": 0.5968172119855704,
|
22 |
-
"eval_runtime": 25.3715,
|
23 |
-
"eval_samples_per_second": 14.741,
|
24 |
-
"eval_steps_per_second": 3.705,
|
25 |
-
"step": 815
|
26 |
-
}
|
27 |
-
],
|
28 |
-
"max_steps": 2445,
|
29 |
-
"num_train_epochs": 3,
|
30 |
-
"total_flos": 31667823325320.0,
|
31 |
-
"trial_name": null,
|
32 |
-
"trial_params": null
|
33 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
last-checkpoint/vocab.txt
DELETED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 263171185
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:813d4e42b9a3f77dcfe3511134461f3f43941a14f4b260dcf89aae7c93ad56b7
|
3 |
size 263171185
|
last-checkpoint/scheduler.pt → runs/May20_16-45-11_1556878e54c8/1653069099.1539524/events.out.tfevents.1653069099.1556878e54c8.71.3
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a71ee3d814bc7818a8ceb0373c3a311690087d6d50f508a3b908ff0f746c40f1
|
3 |
+
size 5150
|
runs/May20_16-45-11_1556878e54c8/events.out.tfevents.1653065256.1556878e54c8.71.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fab5a0c7cc68f8cea44fb0093184eb4c36a06a1c0e5e7fb65ecd80ef90129881
|
3 |
+
size 5625
|
last-checkpoint/training_args.bin → runs/May20_16-45-11_1556878e54c8/events.out.tfevents.1653069099.1556878e54c8.71.2
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8ceaa079af562097b56d679390fa6b42d45a1e54a3c35edd86a4e908a140e02
|
3 |
+
size 5625
|