sharkMeow committed on
Commit
f506eb8
·
verified ·
1 Parent(s): 2a00f55

End of training

Browse files
Files changed (5) hide show
  1. README.md +5 -1
  2. all_results.json +8 -8
  3. eval_results.json +4 -4
  4. train_results.json +4 -4
  5. trainer_state.json +10 -10
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
4
  model-index:
@@ -11,7 +13,9 @@ should probably proofread and complete it, then remove this comment. -->
11
 
12
  # clip-roberta-finetuned
13
 
14
- This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
 
 
15
 
16
  ## Model description
17
 
 
1
  ---
2
+ license: gpl-3.0
3
+ base_model: ckiplab/bert-base-chinese
4
  tags:
5
  - generated_from_trainer
6
  model-index:
 
13
 
14
  # clip-roberta-finetuned
15
 
16
+ This model is a fine-tuned version of [ckiplab/bert-base-chinese](https://huggingface.co/ckiplab/bert-base-chinese) on an unknown dataset.
17
+ It achieves the following results on the evaluation set:
18
+ - Loss: 7.5963
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 100.0,
3
- "eval_loss": 0.054326437413692474,
4
- "eval_runtime": 3.844,
5
- "eval_samples_per_second": 326.223,
6
- "eval_steps_per_second": 3.382,
7
  "total_flos": 1.6588112479488e+16,
8
- "train_loss": 0.4321923828125,
9
- "train_runtime": 849.2414,
10
- "train_samples_per_second": 147.661,
11
- "train_steps_per_second": 1.884
12
  }
 
1
  {
2
  "epoch": 100.0,
3
+ "eval_loss": 7.596293926239014,
4
+ "eval_runtime": 2.0803,
5
+ "eval_samples_per_second": 344.176,
6
+ "eval_steps_per_second": 2.884,
7
  "total_flos": 1.6588112479488e+16,
8
+ "train_loss": 0.5603914216160775,
9
+ "train_runtime": 845.3181,
10
+ "train_samples_per_second": 148.347,
11
+ "train_steps_per_second": 1.893
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 100.0,
3
- "eval_loss": 0.054326437413692474,
4
- "eval_runtime": 3.844,
5
- "eval_samples_per_second": 326.223,
6
- "eval_steps_per_second": 3.382
7
  }
 
1
  {
2
  "epoch": 100.0,
3
+ "eval_loss": 7.596293926239014,
4
+ "eval_runtime": 2.0803,
5
+ "eval_samples_per_second": 344.176,
6
+ "eval_steps_per_second": 2.884
7
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 100.0,
3
  "total_flos": 1.6588112479488e+16,
4
- "train_loss": 0.4321923828125,
5
- "train_runtime": 849.2414,
6
- "train_samples_per_second": 147.661,
7
- "train_steps_per_second": 1.884
8
  }
 
1
  {
2
  "epoch": 100.0,
3
  "total_flos": 1.6588112479488e+16,
4
+ "train_loss": 0.5603914216160775,
5
+ "train_runtime": 845.3181,
6
+ "train_samples_per_second": 148.347,
7
+ "train_steps_per_second": 1.893
8
  }
trainer_state.json CHANGED
@@ -10,33 +10,33 @@
10
  "log_history": [
11
  {
12
  "epoch": 31.25,
13
- "grad_norm": 1.9496452808380127,
14
  "learning_rate": 3.4375e-05,
15
- "loss": 1.2881,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 62.5,
20
- "grad_norm": 0.6210575699806213,
21
  "learning_rate": 1.8750000000000002e-05,
22
- "loss": 0.0667,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 93.75,
27
- "grad_norm": 0.8036883473396301,
28
  "learning_rate": 3.125e-06,
29
- "loss": 0.0245,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 100.0,
34
  "step": 1600,
35
  "total_flos": 1.6588112479488e+16,
36
- "train_loss": 0.4321923828125,
37
- "train_runtime": 849.2414,
38
- "train_samples_per_second": 147.661,
39
- "train_steps_per_second": 1.884
40
  }
41
  ],
42
  "logging_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 31.25,
13
+ "grad_norm": 4.7310919761657715,
14
  "learning_rate": 3.4375e-05,
15
+ "loss": 1.633,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 62.5,
20
+ "grad_norm": 1.100446105003357,
21
  "learning_rate": 1.8750000000000002e-05,
22
+ "loss": 0.1162,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 93.75,
27
+ "grad_norm": 0.6620476841926575,
28
  "learning_rate": 3.125e-06,
29
+ "loss": 0.0385,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 100.0,
34
  "step": 1600,
35
  "total_flos": 1.6588112479488e+16,
36
+ "train_loss": 0.5603914216160775,
37
+ "train_runtime": 845.3181,
38
+ "train_samples_per_second": 148.347,
39
+ "train_steps_per_second": 1.893
40
  }
41
  ],
42
  "logging_steps": 500,