CristianR8
commited on
Commit
•
3dcd2a2
1
Parent(s):
ca27277
End of training
Browse files- README.md +5 -3
- all_results.json +6 -6
- eval_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +304 -304
README.md
CHANGED
@@ -3,6 +3,8 @@ library_name: transformers
|
|
3 |
license: apache-2.0
|
4 |
base_model: google/efficientnet-b0
|
5 |
tags:
|
|
|
|
|
6 |
- generated_from_trainer
|
7 |
metrics:
|
8 |
- accuracy
|
@@ -16,10 +18,10 @@ should probably proofread and complete it, then remove this comment. -->
|
|
16 |
|
17 |
# efficientnet-b0-cocoa
|
18 |
|
19 |
-
This model is a fine-tuned version of [google/efficientnet-b0](https://huggingface.co/google/efficientnet-b0) on
|
20 |
It achieves the following results on the evaluation set:
|
21 |
-
- Loss: 0.
|
22 |
-
- Accuracy: 0.
|
23 |
|
24 |
## Model description
|
25 |
|
|
|
3 |
license: apache-2.0
|
4 |
base_model: google/efficientnet-b0
|
5 |
tags:
|
6 |
+
- image-classification
|
7 |
+
- vision
|
8 |
- generated_from_trainer
|
9 |
metrics:
|
10 |
- accuracy
|
|
|
18 |
|
19 |
# efficientnet-b0-cocoa
|
20 |
|
21 |
+
This model is a fine-tuned version of [google/efficientnet-b0](https://huggingface.co/google/efficientnet-b0) on the SemilleroCV/Cocoa-dataset dataset.
|
22 |
It achieves the following results on the evaluation set:
|
23 |
+
- Loss: 0.2657
|
24 |
+
- Accuracy: 0.9097
|
25 |
|
26 |
## Model description
|
27 |
|
all_results.json
CHANGED
@@ -2,12 +2,12 @@
|
|
2 |
"epoch": 100.0,
|
3 |
"eval_accuracy": 0.9097472924187726,
|
4 |
"eval_loss": 0.26566287875175476,
|
5 |
-
"eval_runtime": 0.
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
"total_flos": 5.678990728814592e+17,
|
9 |
"train_loss": 0.30055975163317455,
|
10 |
-
"train_runtime":
|
11 |
-
"train_samples_per_second":
|
12 |
-
"train_steps_per_second": 20.
|
13 |
}
|
|
|
2 |
"epoch": 100.0,
|
3 |
"eval_accuracy": 0.9097472924187726,
|
4 |
"eval_loss": 0.26566287875175476,
|
5 |
+
"eval_runtime": 0.9793,
|
6 |
+
"eval_samples_per_second": 282.857,
|
7 |
+
"eval_steps_per_second": 35.74,
|
8 |
"total_flos": 5.678990728814592e+17,
|
9 |
"train_loss": 0.30055975163317455,
|
10 |
+
"train_runtime": 949.6972,
|
11 |
+
"train_samples_per_second": 164.895,
|
12 |
+
"train_steps_per_second": 20.638
|
13 |
}
|
eval_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 100.0,
|
3 |
"eval_accuracy": 0.9097472924187726,
|
4 |
"eval_loss": 0.26566287875175476,
|
5 |
-
"eval_runtime": 0.
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
}
|
|
|
2 |
"epoch": 100.0,
|
3 |
"eval_accuracy": 0.9097472924187726,
|
4 |
"eval_loss": 0.26566287875175476,
|
5 |
+
"eval_runtime": 0.9793,
|
6 |
+
"eval_samples_per_second": 282.857,
|
7 |
+
"eval_steps_per_second": 35.74
|
8 |
}
|
train_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 100.0,
|
3 |
"total_flos": 5.678990728814592e+17,
|
4 |
"train_loss": 0.30055975163317455,
|
5 |
-
"train_runtime":
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second": 20.
|
8 |
}
|
|
|
2 |
"epoch": 100.0,
|
3 |
"total_flos": 5.678990728814592e+17,
|
4 |
"train_loss": 0.30055975163317455,
|
5 |
+
"train_runtime": 949.6972,
|
6 |
+
"train_samples_per_second": 164.895,
|
7 |
+
"train_steps_per_second": 20.638
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"best_metric": 0.26566287875175476,
|
3 |
-
"best_model_checkpoint": "./
|
4 |
"epoch": 100.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 19600,
|
@@ -145,9 +145,9 @@
|
|
145 |
"epoch": 1.0,
|
146 |
"eval_accuracy": 0.5595667870036101,
|
147 |
"eval_loss": 1.5222723484039307,
|
148 |
-
"eval_runtime": 0.
|
149 |
-
"eval_samples_per_second":
|
150 |
-
"eval_steps_per_second": 36.
|
151 |
"step": 196
|
152 |
},
|
153 |
{
|
@@ -294,9 +294,9 @@
|
|
294 |
"epoch": 2.0,
|
295 |
"eval_accuracy": 0.8303249097472925,
|
296 |
"eval_loss": 0.8974758386611938,
|
297 |
-
"eval_runtime": 0.
|
298 |
-
"eval_samples_per_second":
|
299 |
-
"eval_steps_per_second": 37.
|
300 |
"step": 392
|
301 |
},
|
302 |
{
|
@@ -436,9 +436,9 @@
|
|
436 |
"epoch": 3.0,
|
437 |
"eval_accuracy": 0.8772563176895307,
|
438 |
"eval_loss": 0.6563544273376465,
|
439 |
-
"eval_runtime": 0.
|
440 |
-
"eval_samples_per_second":
|
441 |
-
"eval_steps_per_second": 37.
|
442 |
"step": 588
|
443 |
},
|
444 |
{
|
@@ -585,9 +585,9 @@
|
|
585 |
"epoch": 4.0,
|
586 |
"eval_accuracy": 0.8339350180505415,
|
587 |
"eval_loss": 0.6841569542884827,
|
588 |
-
"eval_runtime": 0.
|
589 |
-
"eval_samples_per_second":
|
590 |
-
"eval_steps_per_second": 37.
|
591 |
"step": 784
|
592 |
},
|
593 |
{
|
@@ -734,9 +734,9 @@
|
|
734 |
"epoch": 5.0,
|
735 |
"eval_accuracy": 0.8808664259927798,
|
736 |
"eval_loss": 0.48941850662231445,
|
737 |
-
"eval_runtime": 0.
|
738 |
-
"eval_samples_per_second":
|
739 |
-
"eval_steps_per_second": 37.
|
740 |
"step": 980
|
741 |
},
|
742 |
{
|
@@ -876,9 +876,9 @@
|
|
876 |
"epoch": 6.0,
|
877 |
"eval_accuracy": 0.8736462093862816,
|
878 |
"eval_loss": 0.41603580117225647,
|
879 |
-
"eval_runtime": 0.
|
880 |
-
"eval_samples_per_second":
|
881 |
-
"eval_steps_per_second": 37.
|
882 |
"step": 1176
|
883 |
},
|
884 |
{
|
@@ -1025,9 +1025,9 @@
|
|
1025 |
"epoch": 7.0,
|
1026 |
"eval_accuracy": 0.8844765342960289,
|
1027 |
"eval_loss": 0.40221381187438965,
|
1028 |
-
"eval_runtime": 0.
|
1029 |
-
"eval_samples_per_second":
|
1030 |
-
"eval_steps_per_second":
|
1031 |
"step": 1372
|
1032 |
},
|
1033 |
{
|
@@ -1167,9 +1167,9 @@
|
|
1167 |
"epoch": 8.0,
|
1168 |
"eval_accuracy": 0.8411552346570397,
|
1169 |
"eval_loss": 0.4939042627811432,
|
1170 |
-
"eval_runtime": 0.
|
1171 |
-
"eval_samples_per_second":
|
1172 |
-
"eval_steps_per_second": 37.
|
1173 |
"step": 1568
|
1174 |
},
|
1175 |
{
|
@@ -1316,9 +1316,9 @@
|
|
1316 |
"epoch": 9.0,
|
1317 |
"eval_accuracy": 0.8772563176895307,
|
1318 |
"eval_loss": 0.35403916239738464,
|
1319 |
-
"eval_runtime": 0.
|
1320 |
-
"eval_samples_per_second":
|
1321 |
-
"eval_steps_per_second":
|
1322 |
"step": 1764
|
1323 |
},
|
1324 |
{
|
@@ -1465,9 +1465,9 @@
|
|
1465 |
"epoch": 10.0,
|
1466 |
"eval_accuracy": 0.8953068592057761,
|
1467 |
"eval_loss": 0.349290668964386,
|
1468 |
-
"eval_runtime": 0.
|
1469 |
-
"eval_samples_per_second":
|
1470 |
-
"eval_steps_per_second": 37.
|
1471 |
"step": 1960
|
1472 |
},
|
1473 |
{
|
@@ -1607,9 +1607,9 @@
|
|
1607 |
"epoch": 11.0,
|
1608 |
"eval_accuracy": 0.776173285198556,
|
1609 |
"eval_loss": 0.7928438186645508,
|
1610 |
-
"eval_runtime": 0.
|
1611 |
-
"eval_samples_per_second":
|
1612 |
-
"eval_steps_per_second": 37.
|
1613 |
"step": 2156
|
1614 |
},
|
1615 |
{
|
@@ -1756,9 +1756,9 @@
|
|
1756 |
"epoch": 12.0,
|
1757 |
"eval_accuracy": 0.296028880866426,
|
1758 |
"eval_loss": 2.06593918800354,
|
1759 |
-
"eval_runtime": 0.
|
1760 |
-
"eval_samples_per_second":
|
1761 |
-
"eval_steps_per_second":
|
1762 |
"step": 2352
|
1763 |
},
|
1764 |
{
|
@@ -1898,9 +1898,9 @@
|
|
1898 |
"epoch": 13.0,
|
1899 |
"eval_accuracy": 0.851985559566787,
|
1900 |
"eval_loss": 0.44439464807510376,
|
1901 |
-
"eval_runtime": 0.
|
1902 |
-
"eval_samples_per_second":
|
1903 |
-
"eval_steps_per_second": 37.
|
1904 |
"step": 2548
|
1905 |
},
|
1906 |
{
|
@@ -2047,9 +2047,9 @@
|
|
2047 |
"epoch": 14.0,
|
2048 |
"eval_accuracy": 0.8736462093862816,
|
2049 |
"eval_loss": 0.46400919556617737,
|
2050 |
-
"eval_runtime": 0.
|
2051 |
-
"eval_samples_per_second":
|
2052 |
-
"eval_steps_per_second":
|
2053 |
"step": 2744
|
2054 |
},
|
2055 |
{
|
@@ -2196,9 +2196,9 @@
|
|
2196 |
"epoch": 15.0,
|
2197 |
"eval_accuracy": 0.8772563176895307,
|
2198 |
"eval_loss": 0.37753719091415405,
|
2199 |
-
"eval_runtime": 0.
|
2200 |
-
"eval_samples_per_second":
|
2201 |
-
"eval_steps_per_second": 37.
|
2202 |
"step": 2940
|
2203 |
},
|
2204 |
{
|
@@ -2338,9 +2338,9 @@
|
|
2338 |
"epoch": 16.0,
|
2339 |
"eval_accuracy": 0.8880866425992779,
|
2340 |
"eval_loss": 0.3519056737422943,
|
2341 |
-
"eval_runtime": 0.
|
2342 |
-
"eval_samples_per_second":
|
2343 |
-
"eval_steps_per_second": 37.
|
2344 |
"step": 3136
|
2345 |
},
|
2346 |
{
|
@@ -2487,9 +2487,9 @@
|
|
2487 |
"epoch": 17.0,
|
2488 |
"eval_accuracy": 0.9061371841155235,
|
2489 |
"eval_loss": 0.33103030920028687,
|
2490 |
-
"eval_runtime": 0.
|
2491 |
-
"eval_samples_per_second":
|
2492 |
-
"eval_steps_per_second": 37.
|
2493 |
"step": 3332
|
2494 |
},
|
2495 |
{
|
@@ -2629,9 +2629,9 @@
|
|
2629 |
"epoch": 18.0,
|
2630 |
"eval_accuracy": 0.8916967509025271,
|
2631 |
"eval_loss": 0.34751203656196594,
|
2632 |
-
"eval_runtime": 0.
|
2633 |
-
"eval_samples_per_second":
|
2634 |
-
"eval_steps_per_second":
|
2635 |
"step": 3528
|
2636 |
},
|
2637 |
{
|
@@ -2778,9 +2778,9 @@
|
|
2778 |
"epoch": 19.0,
|
2779 |
"eval_accuracy": 0.8592057761732852,
|
2780 |
"eval_loss": 0.38391339778900146,
|
2781 |
-
"eval_runtime": 0.
|
2782 |
-
"eval_samples_per_second":
|
2783 |
-
"eval_steps_per_second": 37.
|
2784 |
"step": 3724
|
2785 |
},
|
2786 |
{
|
@@ -2927,9 +2927,9 @@
|
|
2927 |
"epoch": 20.0,
|
2928 |
"eval_accuracy": 0.9133574007220217,
|
2929 |
"eval_loss": 0.3031846880912781,
|
2930 |
-
"eval_runtime": 0.
|
2931 |
-
"eval_samples_per_second":
|
2932 |
-
"eval_steps_per_second": 37.
|
2933 |
"step": 3920
|
2934 |
},
|
2935 |
{
|
@@ -3069,9 +3069,9 @@
|
|
3069 |
"epoch": 21.0,
|
3070 |
"eval_accuracy": 0.851985559566787,
|
3071 |
"eval_loss": 0.4246116876602173,
|
3072 |
-
"eval_runtime": 0.
|
3073 |
-
"eval_samples_per_second":
|
3074 |
-
"eval_steps_per_second":
|
3075 |
"step": 4116
|
3076 |
},
|
3077 |
{
|
@@ -3218,9 +3218,9 @@
|
|
3218 |
"epoch": 22.0,
|
3219 |
"eval_accuracy": 0.8989169675090253,
|
3220 |
"eval_loss": 0.29509276151657104,
|
3221 |
-
"eval_runtime": 0.
|
3222 |
-
"eval_samples_per_second":
|
3223 |
-
"eval_steps_per_second":
|
3224 |
"step": 4312
|
3225 |
},
|
3226 |
{
|
@@ -3360,9 +3360,9 @@
|
|
3360 |
"epoch": 23.0,
|
3361 |
"eval_accuracy": 0.851985559566787,
|
3362 |
"eval_loss": 0.4356595277786255,
|
3363 |
-
"eval_runtime": 0.
|
3364 |
-
"eval_samples_per_second":
|
3365 |
-
"eval_steps_per_second":
|
3366 |
"step": 4508
|
3367 |
},
|
3368 |
{
|
@@ -3509,9 +3509,9 @@
|
|
3509 |
"epoch": 24.0,
|
3510 |
"eval_accuracy": 0.8916967509025271,
|
3511 |
"eval_loss": 0.399036169052124,
|
3512 |
-
"eval_runtime": 0.
|
3513 |
-
"eval_samples_per_second":
|
3514 |
-
"eval_steps_per_second":
|
3515 |
"step": 4704
|
3516 |
},
|
3517 |
{
|
@@ -3658,9 +3658,9 @@
|
|
3658 |
"epoch": 25.0,
|
3659 |
"eval_accuracy": 0.9097472924187726,
|
3660 |
"eval_loss": 0.35359257459640503,
|
3661 |
-
"eval_runtime": 0.
|
3662 |
-
"eval_samples_per_second":
|
3663 |
-
"eval_steps_per_second":
|
3664 |
"step": 4900
|
3665 |
},
|
3666 |
{
|
@@ -3800,9 +3800,9 @@
|
|
3800 |
"epoch": 26.0,
|
3801 |
"eval_accuracy": 0.8592057761732852,
|
3802 |
"eval_loss": 0.4166140854358673,
|
3803 |
-
"eval_runtime": 0.
|
3804 |
-
"eval_samples_per_second":
|
3805 |
-
"eval_steps_per_second":
|
3806 |
"step": 5096
|
3807 |
},
|
3808 |
{
|
@@ -3949,9 +3949,9 @@
|
|
3949 |
"epoch": 27.0,
|
3950 |
"eval_accuracy": 0.851985559566787,
|
3951 |
"eval_loss": 0.4353993237018585,
|
3952 |
-
"eval_runtime": 0.
|
3953 |
-
"eval_samples_per_second":
|
3954 |
-
"eval_steps_per_second": 37.
|
3955 |
"step": 5292
|
3956 |
},
|
3957 |
{
|
@@ -4091,9 +4091,9 @@
|
|
4091 |
"epoch": 28.0,
|
4092 |
"eval_accuracy": 0.8592057761732852,
|
4093 |
"eval_loss": 0.4088672697544098,
|
4094 |
-
"eval_runtime": 0.
|
4095 |
-
"eval_samples_per_second":
|
4096 |
-
"eval_steps_per_second": 37.
|
4097 |
"step": 5488
|
4098 |
},
|
4099 |
{
|
@@ -4240,9 +4240,9 @@
|
|
4240 |
"epoch": 29.0,
|
4241 |
"eval_accuracy": 0.8231046931407943,
|
4242 |
"eval_loss": 0.4787161946296692,
|
4243 |
-
"eval_runtime": 0.
|
4244 |
-
"eval_samples_per_second":
|
4245 |
-
"eval_steps_per_second":
|
4246 |
"step": 5684
|
4247 |
},
|
4248 |
{
|
@@ -4389,9 +4389,9 @@
|
|
4389 |
"epoch": 30.0,
|
4390 |
"eval_accuracy": 0.9097472924187726,
|
4391 |
"eval_loss": 0.3165305256843567,
|
4392 |
-
"eval_runtime": 0.
|
4393 |
-
"eval_samples_per_second":
|
4394 |
-
"eval_steps_per_second": 37.
|
4395 |
"step": 5880
|
4396 |
},
|
4397 |
{
|
@@ -4531,9 +4531,9 @@
|
|
4531 |
"epoch": 31.0,
|
4532 |
"eval_accuracy": 0.9133574007220217,
|
4533 |
"eval_loss": 0.31053850054740906,
|
4534 |
-
"eval_runtime": 0.
|
4535 |
-
"eval_samples_per_second":
|
4536 |
-
"eval_steps_per_second": 37.
|
4537 |
"step": 6076
|
4538 |
},
|
4539 |
{
|
@@ -4680,9 +4680,9 @@
|
|
4680 |
"epoch": 32.0,
|
4681 |
"eval_accuracy": 0.9061371841155235,
|
4682 |
"eval_loss": 0.3559906780719757,
|
4683 |
-
"eval_runtime": 0.
|
4684 |
-
"eval_samples_per_second":
|
4685 |
-
"eval_steps_per_second":
|
4686 |
"step": 6272
|
4687 |
},
|
4688 |
{
|
@@ -4822,9 +4822,9 @@
|
|
4822 |
"epoch": 33.0,
|
4823 |
"eval_accuracy": 0.9097472924187726,
|
4824 |
"eval_loss": 0.26566287875175476,
|
4825 |
-
"eval_runtime": 0.
|
4826 |
-
"eval_samples_per_second":
|
4827 |
-
"eval_steps_per_second": 37.
|
4828 |
"step": 6468
|
4829 |
},
|
4830 |
{
|
@@ -4971,9 +4971,9 @@
|
|
4971 |
"epoch": 34.0,
|
4972 |
"eval_accuracy": 0.9133574007220217,
|
4973 |
"eval_loss": 0.2679595947265625,
|
4974 |
-
"eval_runtime": 0.
|
4975 |
-
"eval_samples_per_second": 295.
|
4976 |
-
"eval_steps_per_second": 37.
|
4977 |
"step": 6664
|
4978 |
},
|
4979 |
{
|
@@ -5120,9 +5120,9 @@
|
|
5120 |
"epoch": 35.0,
|
5121 |
"eval_accuracy": 0.9061371841155235,
|
5122 |
"eval_loss": 0.3797638416290283,
|
5123 |
-
"eval_runtime": 0.
|
5124 |
-
"eval_samples_per_second":
|
5125 |
-
"eval_steps_per_second": 37.
|
5126 |
"step": 6860
|
5127 |
},
|
5128 |
{
|
@@ -5262,9 +5262,9 @@
|
|
5262 |
"epoch": 36.0,
|
5263 |
"eval_accuracy": 0.855595667870036,
|
5264 |
"eval_loss": 0.5098311305046082,
|
5265 |
-
"eval_runtime": 0.
|
5266 |
-
"eval_samples_per_second":
|
5267 |
-
"eval_steps_per_second": 37.
|
5268 |
"step": 7056
|
5269 |
},
|
5270 |
{
|
@@ -5411,9 +5411,9 @@
|
|
5411 |
"epoch": 37.0,
|
5412 |
"eval_accuracy": 0.8808664259927798,
|
5413 |
"eval_loss": 0.42190420627593994,
|
5414 |
-
"eval_runtime": 0.
|
5415 |
-
"eval_samples_per_second":
|
5416 |
-
"eval_steps_per_second": 37.
|
5417 |
"step": 7252
|
5418 |
},
|
5419 |
{
|
@@ -5553,9 +5553,9 @@
|
|
5553 |
"epoch": 38.0,
|
5554 |
"eval_accuracy": 0.9133574007220217,
|
5555 |
"eval_loss": 0.2851579189300537,
|
5556 |
-
"eval_runtime": 0.
|
5557 |
-
"eval_samples_per_second":
|
5558 |
-
"eval_steps_per_second":
|
5559 |
"step": 7448
|
5560 |
},
|
5561 |
{
|
@@ -5702,9 +5702,9 @@
|
|
5702 |
"epoch": 39.0,
|
5703 |
"eval_accuracy": 0.8989169675090253,
|
5704 |
"eval_loss": 0.36030298471450806,
|
5705 |
-
"eval_runtime": 0.
|
5706 |
-
"eval_samples_per_second":
|
5707 |
-
"eval_steps_per_second": 37.
|
5708 |
"step": 7644
|
5709 |
},
|
5710 |
{
|
@@ -5851,9 +5851,9 @@
|
|
5851 |
"epoch": 40.0,
|
5852 |
"eval_accuracy": 0.8736462093862816,
|
5853 |
"eval_loss": 0.351894736289978,
|
5854 |
-
"eval_runtime": 0.
|
5855 |
-
"eval_samples_per_second":
|
5856 |
-
"eval_steps_per_second": 37.
|
5857 |
"step": 7840
|
5858 |
},
|
5859 |
{
|
@@ -5993,9 +5993,9 @@
|
|
5993 |
"epoch": 41.0,
|
5994 |
"eval_accuracy": 0.9025270758122743,
|
5995 |
"eval_loss": 0.3343473970890045,
|
5996 |
-
"eval_runtime": 0.
|
5997 |
-
"eval_samples_per_second":
|
5998 |
-
"eval_steps_per_second": 37.
|
5999 |
"step": 8036
|
6000 |
},
|
6001 |
{
|
@@ -6142,9 +6142,9 @@
|
|
6142 |
"epoch": 42.0,
|
6143 |
"eval_accuracy": 0.9169675090252708,
|
6144 |
"eval_loss": 0.3383941352367401,
|
6145 |
-
"eval_runtime": 0.
|
6146 |
-
"eval_samples_per_second":
|
6147 |
-
"eval_steps_per_second": 37.
|
6148 |
"step": 8232
|
6149 |
},
|
6150 |
{
|
@@ -6284,9 +6284,9 @@
|
|
6284 |
"epoch": 43.0,
|
6285 |
"eval_accuracy": 0.8772563176895307,
|
6286 |
"eval_loss": 0.40458711981773376,
|
6287 |
-
"eval_runtime": 0.
|
6288 |
-
"eval_samples_per_second":
|
6289 |
-
"eval_steps_per_second": 37.
|
6290 |
"step": 8428
|
6291 |
},
|
6292 |
{
|
@@ -6433,9 +6433,9 @@
|
|
6433 |
"epoch": 44.0,
|
6434 |
"eval_accuracy": 0.8916967509025271,
|
6435 |
"eval_loss": 0.39525121450424194,
|
6436 |
-
"eval_runtime": 0.
|
6437 |
-
"eval_samples_per_second":
|
6438 |
-
"eval_steps_per_second": 37.
|
6439 |
"step": 8624
|
6440 |
},
|
6441 |
{
|
@@ -6582,9 +6582,9 @@
|
|
6582 |
"epoch": 45.0,
|
6583 |
"eval_accuracy": 0.8592057761732852,
|
6584 |
"eval_loss": 0.5002943873405457,
|
6585 |
-
"eval_runtime": 0.
|
6586 |
-
"eval_samples_per_second": 297.
|
6587 |
-
"eval_steps_per_second": 37.
|
6588 |
"step": 8820
|
6589 |
},
|
6590 |
{
|
@@ -6724,9 +6724,9 @@
|
|
6724 |
"epoch": 46.0,
|
6725 |
"eval_accuracy": 0.9169675090252708,
|
6726 |
"eval_loss": 0.3231888711452484,
|
6727 |
-
"eval_runtime": 0.
|
6728 |
-
"eval_samples_per_second":
|
6729 |
-
"eval_steps_per_second": 37.
|
6730 |
"step": 9016
|
6731 |
},
|
6732 |
{
|
@@ -6873,9 +6873,9 @@
|
|
6873 |
"epoch": 47.0,
|
6874 |
"eval_accuracy": 0.9169675090252708,
|
6875 |
"eval_loss": 0.3112559914588928,
|
6876 |
-
"eval_runtime": 0.
|
6877 |
-
"eval_samples_per_second":
|
6878 |
-
"eval_steps_per_second": 37.
|
6879 |
"step": 9212
|
6880 |
},
|
6881 |
{
|
@@ -7015,9 +7015,9 @@
|
|
7015 |
"epoch": 48.0,
|
7016 |
"eval_accuracy": 0.855595667870036,
|
7017 |
"eval_loss": 0.4494384229183197,
|
7018 |
-
"eval_runtime": 0.
|
7019 |
-
"eval_samples_per_second":
|
7020 |
-
"eval_steps_per_second": 37.
|
7021 |
"step": 9408
|
7022 |
},
|
7023 |
{
|
@@ -7164,9 +7164,9 @@
|
|
7164 |
"epoch": 49.0,
|
7165 |
"eval_accuracy": 0.9205776173285198,
|
7166 |
"eval_loss": 0.37217509746551514,
|
7167 |
-
"eval_runtime": 0.
|
7168 |
-
"eval_samples_per_second":
|
7169 |
-
"eval_steps_per_second": 37.
|
7170 |
"step": 9604
|
7171 |
},
|
7172 |
{
|
@@ -7313,9 +7313,9 @@
|
|
7313 |
"epoch": 50.0,
|
7314 |
"eval_accuracy": 0.9097472924187726,
|
7315 |
"eval_loss": 0.2852139472961426,
|
7316 |
-
"eval_runtime": 0.
|
7317 |
-
"eval_samples_per_second":
|
7318 |
-
"eval_steps_per_second": 37.
|
7319 |
"step": 9800
|
7320 |
},
|
7321 |
{
|
@@ -7455,9 +7455,9 @@
|
|
7455 |
"epoch": 51.0,
|
7456 |
"eval_accuracy": 0.8628158844765343,
|
7457 |
"eval_loss": 0.4137951135635376,
|
7458 |
-
"eval_runtime": 0.
|
7459 |
-
"eval_samples_per_second":
|
7460 |
-
"eval_steps_per_second": 37.
|
7461 |
"step": 9996
|
7462 |
},
|
7463 |
{
|
@@ -7604,9 +7604,9 @@
|
|
7604 |
"epoch": 52.0,
|
7605 |
"eval_accuracy": 0.8953068592057761,
|
7606 |
"eval_loss": 0.34130236506462097,
|
7607 |
-
"eval_runtime": 0.
|
7608 |
-
"eval_samples_per_second":
|
7609 |
-
"eval_steps_per_second":
|
7610 |
"step": 10192
|
7611 |
},
|
7612 |
{
|
@@ -7746,9 +7746,9 @@
|
|
7746 |
"epoch": 53.0,
|
7747 |
"eval_accuracy": 0.9169675090252708,
|
7748 |
"eval_loss": 0.30462250113487244,
|
7749 |
-
"eval_runtime": 0.
|
7750 |
-
"eval_samples_per_second":
|
7751 |
-
"eval_steps_per_second":
|
7752 |
"step": 10388
|
7753 |
},
|
7754 |
{
|
@@ -7895,9 +7895,9 @@
|
|
7895 |
"epoch": 54.0,
|
7896 |
"eval_accuracy": 0.8989169675090253,
|
7897 |
"eval_loss": 0.2849152684211731,
|
7898 |
-
"eval_runtime": 0.
|
7899 |
-
"eval_samples_per_second":
|
7900 |
-
"eval_steps_per_second": 37.
|
7901 |
"step": 10584
|
7902 |
},
|
7903 |
{
|
@@ -8044,9 +8044,9 @@
|
|
8044 |
"epoch": 55.0,
|
8045 |
"eval_accuracy": 0.9133574007220217,
|
8046 |
"eval_loss": 0.35168057680130005,
|
8047 |
-
"eval_runtime": 0.
|
8048 |
-
"eval_samples_per_second":
|
8049 |
-
"eval_steps_per_second": 37.
|
8050 |
"step": 10780
|
8051 |
},
|
8052 |
{
|
@@ -8186,9 +8186,9 @@
|
|
8186 |
"epoch": 56.0,
|
8187 |
"eval_accuracy": 0.9025270758122743,
|
8188 |
"eval_loss": 0.45381447672843933,
|
8189 |
-
"eval_runtime": 0.
|
8190 |
-
"eval_samples_per_second":
|
8191 |
-
"eval_steps_per_second":
|
8192 |
"step": 10976
|
8193 |
},
|
8194 |
{
|
@@ -8335,9 +8335,9 @@
|
|
8335 |
"epoch": 57.0,
|
8336 |
"eval_accuracy": 0.8592057761732852,
|
8337 |
"eval_loss": 0.44916799664497375,
|
8338 |
-
"eval_runtime": 0.
|
8339 |
-
"eval_samples_per_second": 295.
|
8340 |
-
"eval_steps_per_second": 37.
|
8341 |
"step": 11172
|
8342 |
},
|
8343 |
{
|
@@ -8477,9 +8477,9 @@
|
|
8477 |
"epoch": 58.0,
|
8478 |
"eval_accuracy": 0.8628158844765343,
|
8479 |
"eval_loss": 0.4738902747631073,
|
8480 |
-
"eval_runtime": 0.
|
8481 |
-
"eval_samples_per_second":
|
8482 |
-
"eval_steps_per_second": 37.
|
8483 |
"step": 11368
|
8484 |
},
|
8485 |
{
|
@@ -8626,9 +8626,9 @@
|
|
8626 |
"epoch": 59.0,
|
8627 |
"eval_accuracy": 0.9205776173285198,
|
8628 |
"eval_loss": 0.2831103205680847,
|
8629 |
-
"eval_runtime": 0.
|
8630 |
-
"eval_samples_per_second":
|
8631 |
-
"eval_steps_per_second": 37.
|
8632 |
"step": 11564
|
8633 |
},
|
8634 |
{
|
@@ -8775,9 +8775,9 @@
|
|
8775 |
"epoch": 60.0,
|
8776 |
"eval_accuracy": 0.9205776173285198,
|
8777 |
"eval_loss": 0.34654152393341064,
|
8778 |
-
"eval_runtime": 0.
|
8779 |
-
"eval_samples_per_second":
|
8780 |
-
"eval_steps_per_second": 37.
|
8781 |
"step": 11760
|
8782 |
},
|
8783 |
{
|
@@ -8917,9 +8917,9 @@
|
|
8917 |
"epoch": 61.0,
|
8918 |
"eval_accuracy": 0.9314079422382672,
|
8919 |
"eval_loss": 0.28843551874160767,
|
8920 |
-
"eval_runtime": 0.
|
8921 |
-
"eval_samples_per_second": 295.
|
8922 |
-
"eval_steps_per_second": 37.
|
8923 |
"step": 11956
|
8924 |
},
|
8925 |
{
|
@@ -9066,9 +9066,9 @@
|
|
9066 |
"epoch": 62.0,
|
9067 |
"eval_accuracy": 0.8447653429602888,
|
9068 |
"eval_loss": 0.4874745309352875,
|
9069 |
-
"eval_runtime": 0.
|
9070 |
-
"eval_samples_per_second":
|
9071 |
-
"eval_steps_per_second": 37.
|
9072 |
"step": 12152
|
9073 |
},
|
9074 |
{
|
@@ -9208,9 +9208,9 @@
|
|
9208 |
"epoch": 63.0,
|
9209 |
"eval_accuracy": 0.9061371841155235,
|
9210 |
"eval_loss": 0.3988655209541321,
|
9211 |
-
"eval_runtime": 0.
|
9212 |
-
"eval_samples_per_second":
|
9213 |
-
"eval_steps_per_second": 37.
|
9214 |
"step": 12348
|
9215 |
},
|
9216 |
{
|
@@ -9357,9 +9357,9 @@
|
|
9357 |
"epoch": 64.0,
|
9358 |
"eval_accuracy": 0.851985559566787,
|
9359 |
"eval_loss": 0.5952923893928528,
|
9360 |
-
"eval_runtime": 0.
|
9361 |
-
"eval_samples_per_second":
|
9362 |
-
"eval_steps_per_second": 37.
|
9363 |
"step": 12544
|
9364 |
},
|
9365 |
{
|
@@ -9506,9 +9506,9 @@
|
|
9506 |
"epoch": 65.0,
|
9507 |
"eval_accuracy": 0.927797833935018,
|
9508 |
"eval_loss": 0.2953914701938629,
|
9509 |
-
"eval_runtime": 0.
|
9510 |
-
"eval_samples_per_second":
|
9511 |
-
"eval_steps_per_second":
|
9512 |
"step": 12740
|
9513 |
},
|
9514 |
{
|
@@ -9648,9 +9648,9 @@
|
|
9648 |
"epoch": 66.0,
|
9649 |
"eval_accuracy": 0.851985559566787,
|
9650 |
"eval_loss": 0.5033073425292969,
|
9651 |
-
"eval_runtime": 0.
|
9652 |
-
"eval_samples_per_second":
|
9653 |
-
"eval_steps_per_second": 37.
|
9654 |
"step": 12936
|
9655 |
},
|
9656 |
{
|
@@ -9797,9 +9797,9 @@
|
|
9797 |
"epoch": 67.0,
|
9798 |
"eval_accuracy": 0.8808664259927798,
|
9799 |
"eval_loss": 0.41321179270744324,
|
9800 |
-
"eval_runtime": 0.
|
9801 |
-
"eval_samples_per_second":
|
9802 |
-
"eval_steps_per_second":
|
9803 |
"step": 13132
|
9804 |
},
|
9805 |
{
|
@@ -9939,9 +9939,9 @@
|
|
9939 |
"epoch": 68.0,
|
9940 |
"eval_accuracy": 0.9169675090252708,
|
9941 |
"eval_loss": 0.37430626153945923,
|
9942 |
-
"eval_runtime": 0.
|
9943 |
-
"eval_samples_per_second":
|
9944 |
-
"eval_steps_per_second": 37.
|
9945 |
"step": 13328
|
9946 |
},
|
9947 |
{
|
@@ -10088,9 +10088,9 @@
|
|
10088 |
"epoch": 69.0,
|
10089 |
"eval_accuracy": 0.776173285198556,
|
10090 |
"eval_loss": 0.6423271298408508,
|
10091 |
-
"eval_runtime": 0.
|
10092 |
-
"eval_samples_per_second":
|
10093 |
-
"eval_steps_per_second":
|
10094 |
"step": 13524
|
10095 |
},
|
10096 |
{
|
@@ -10237,9 +10237,9 @@
|
|
10237 |
"epoch": 70.0,
|
10238 |
"eval_accuracy": 0.8014440433212996,
|
10239 |
"eval_loss": 0.5979345440864563,
|
10240 |
-
"eval_runtime": 0.
|
10241 |
-
"eval_samples_per_second":
|
10242 |
-
"eval_steps_per_second": 37.
|
10243 |
"step": 13720
|
10244 |
},
|
10245 |
{
|
@@ -10379,9 +10379,9 @@
|
|
10379 |
"epoch": 71.0,
|
10380 |
"eval_accuracy": 0.8989169675090253,
|
10381 |
"eval_loss": 0.43981537222862244,
|
10382 |
-
"eval_runtime": 0.
|
10383 |
-
"eval_samples_per_second":
|
10384 |
-
"eval_steps_per_second": 37.
|
10385 |
"step": 13916
|
10386 |
},
|
10387 |
{
|
@@ -10528,9 +10528,9 @@
|
|
10528 |
"epoch": 72.0,
|
10529 |
"eval_accuracy": 0.8231046931407943,
|
10530 |
"eval_loss": 0.5633912086486816,
|
10531 |
-
"eval_runtime": 0.
|
10532 |
-
"eval_samples_per_second":
|
10533 |
-
"eval_steps_per_second": 37.
|
10534 |
"step": 14112
|
10535 |
},
|
10536 |
{
|
@@ -10670,9 +10670,9 @@
|
|
10670 |
"epoch": 73.0,
|
10671 |
"eval_accuracy": 0.776173285198556,
|
10672 |
"eval_loss": 0.620398223400116,
|
10673 |
-
"eval_runtime": 0.
|
10674 |
-
"eval_samples_per_second":
|
10675 |
-
"eval_steps_per_second": 37.
|
10676 |
"step": 14308
|
10677 |
},
|
10678 |
{
|
@@ -10819,9 +10819,9 @@
|
|
10819 |
"epoch": 74.0,
|
10820 |
"eval_accuracy": 0.8953068592057761,
|
10821 |
"eval_loss": 0.36853671073913574,
|
10822 |
-
"eval_runtime": 0.
|
10823 |
-
"eval_samples_per_second":
|
10824 |
-
"eval_steps_per_second": 37.
|
10825 |
"step": 14504
|
10826 |
},
|
10827 |
{
|
@@ -10968,9 +10968,9 @@
|
|
10968 |
"epoch": 75.0,
|
10969 |
"eval_accuracy": 0.8158844765342961,
|
10970 |
"eval_loss": 0.7026161551475525,
|
10971 |
-
"eval_runtime": 0.
|
10972 |
-
"eval_samples_per_second":
|
10973 |
-
"eval_steps_per_second": 37.
|
10974 |
"step": 14700
|
10975 |
},
|
10976 |
{
|
@@ -11110,9 +11110,9 @@
|
|
11110 |
"epoch": 76.0,
|
11111 |
"eval_accuracy": 0.9169675090252708,
|
11112 |
"eval_loss": 0.40481600165367126,
|
11113 |
-
"eval_runtime": 0.
|
11114 |
-
"eval_samples_per_second":
|
11115 |
-
"eval_steps_per_second": 37.
|
11116 |
"step": 14896
|
11117 |
},
|
11118 |
{
|
@@ -11259,9 +11259,9 @@
|
|
11259 |
"epoch": 77.0,
|
11260 |
"eval_accuracy": 0.8844765342960289,
|
11261 |
"eval_loss": 0.48912858963012695,
|
11262 |
-
"eval_runtime": 0.
|
11263 |
-
"eval_samples_per_second":
|
11264 |
-
"eval_steps_per_second": 37.
|
11265 |
"step": 15092
|
11266 |
},
|
11267 |
{
|
@@ -11401,9 +11401,9 @@
|
|
11401 |
"epoch": 78.0,
|
11402 |
"eval_accuracy": 0.8772563176895307,
|
11403 |
"eval_loss": 0.42159637808799744,
|
11404 |
-
"eval_runtime": 0.
|
11405 |
-
"eval_samples_per_second":
|
11406 |
-
"eval_steps_per_second":
|
11407 |
"step": 15288
|
11408 |
},
|
11409 |
{
|
@@ -11550,9 +11550,9 @@
|
|
11550 |
"epoch": 79.0,
|
11551 |
"eval_accuracy": 0.8953068592057761,
|
11552 |
"eval_loss": 0.2720978558063507,
|
11553 |
-
"eval_runtime": 0.
|
11554 |
-
"eval_samples_per_second":
|
11555 |
-
"eval_steps_per_second": 37.
|
11556 |
"step": 15484
|
11557 |
},
|
11558 |
{
|
@@ -11699,9 +11699,9 @@
|
|
11699 |
"epoch": 80.0,
|
11700 |
"eval_accuracy": 0.8483754512635379,
|
11701 |
"eval_loss": 0.42701977491378784,
|
11702 |
-
"eval_runtime": 0.
|
11703 |
-
"eval_samples_per_second":
|
11704 |
-
"eval_steps_per_second":
|
11705 |
"step": 15680
|
11706 |
},
|
11707 |
{
|
@@ -11841,9 +11841,9 @@
|
|
11841 |
"epoch": 81.0,
|
11842 |
"eval_accuracy": 0.7833935018050542,
|
11843 |
"eval_loss": 0.763225793838501,
|
11844 |
-
"eval_runtime": 0.
|
11845 |
-
"eval_samples_per_second":
|
11846 |
-
"eval_steps_per_second": 37.
|
11847 |
"step": 15876
|
11848 |
},
|
11849 |
{
|
@@ -11990,9 +11990,9 @@
|
|
11990 |
"epoch": 82.0,
|
11991 |
"eval_accuracy": 0.9025270758122743,
|
11992 |
"eval_loss": 0.3249270021915436,
|
11993 |
-
"eval_runtime": 0.
|
11994 |
-
"eval_samples_per_second":
|
11995 |
-
"eval_steps_per_second":
|
11996 |
"step": 16072
|
11997 |
},
|
11998 |
{
|
@@ -12132,9 +12132,9 @@
|
|
12132 |
"epoch": 83.0,
|
12133 |
"eval_accuracy": 0.8989169675090253,
|
12134 |
"eval_loss": 0.38384127616882324,
|
12135 |
-
"eval_runtime": 0.
|
12136 |
-
"eval_samples_per_second":
|
12137 |
-
"eval_steps_per_second": 37.
|
12138 |
"step": 16268
|
12139 |
},
|
12140 |
{
|
@@ -12281,9 +12281,9 @@
|
|
12281 |
"epoch": 84.0,
|
12282 |
"eval_accuracy": 0.9205776173285198,
|
12283 |
"eval_loss": 0.3329784572124481,
|
12284 |
-
"eval_runtime": 0.
|
12285 |
-
"eval_samples_per_second":
|
12286 |
-
"eval_steps_per_second": 37.
|
12287 |
"step": 16464
|
12288 |
},
|
12289 |
{
|
@@ -12430,9 +12430,9 @@
|
|
12430 |
"epoch": 85.0,
|
12431 |
"eval_accuracy": 0.8700361010830325,
|
12432 |
"eval_loss": 0.32456666231155396,
|
12433 |
-
"eval_runtime": 0.
|
12434 |
-
"eval_samples_per_second":
|
12435 |
-
"eval_steps_per_second": 37.
|
12436 |
"step": 16660
|
12437 |
},
|
12438 |
{
|
@@ -12572,9 +12572,9 @@
|
|
12572 |
"epoch": 86.0,
|
12573 |
"eval_accuracy": 0.8736462093862816,
|
12574 |
"eval_loss": 0.3710058927536011,
|
12575 |
-
"eval_runtime": 0.
|
12576 |
-
"eval_samples_per_second":
|
12577 |
-
"eval_steps_per_second":
|
12578 |
"step": 16856
|
12579 |
},
|
12580 |
{
|
@@ -12721,9 +12721,9 @@
|
|
12721 |
"epoch": 87.0,
|
12722 |
"eval_accuracy": 0.9061371841155235,
|
12723 |
"eval_loss": 0.33839184045791626,
|
12724 |
-
"eval_runtime": 0.
|
12725 |
-
"eval_samples_per_second":
|
12726 |
-
"eval_steps_per_second":
|
12727 |
"step": 17052
|
12728 |
},
|
12729 |
{
|
@@ -12863,9 +12863,9 @@
|
|
12863 |
"epoch": 88.0,
|
12864 |
"eval_accuracy": 0.9097472924187726,
|
12865 |
"eval_loss": 0.3703186511993408,
|
12866 |
-
"eval_runtime": 0.
|
12867 |
-
"eval_samples_per_second":
|
12868 |
-
"eval_steps_per_second":
|
12869 |
"step": 17248
|
12870 |
},
|
12871 |
{
|
@@ -13012,9 +13012,9 @@
|
|
13012 |
"epoch": 89.0,
|
13013 |
"eval_accuracy": 0.8592057761732852,
|
13014 |
"eval_loss": 0.5013492703437805,
|
13015 |
-
"eval_runtime": 0.
|
13016 |
-
"eval_samples_per_second":
|
13017 |
-
"eval_steps_per_second":
|
13018 |
"step": 17444
|
13019 |
},
|
13020 |
{
|
@@ -13161,9 +13161,9 @@
|
|
13161 |
"epoch": 90.0,
|
13162 |
"eval_accuracy": 0.8989169675090253,
|
13163 |
"eval_loss": 0.3456423580646515,
|
13164 |
-
"eval_runtime":
|
13165 |
-
"eval_samples_per_second":
|
13166 |
-
"eval_steps_per_second":
|
13167 |
"step": 17640
|
13168 |
},
|
13169 |
{
|
@@ -13303,9 +13303,9 @@
|
|
13303 |
"epoch": 91.0,
|
13304 |
"eval_accuracy": 0.8880866425992779,
|
13305 |
"eval_loss": 0.3798539340496063,
|
13306 |
-
"eval_runtime": 0.
|
13307 |
-
"eval_samples_per_second":
|
13308 |
-
"eval_steps_per_second":
|
13309 |
"step": 17836
|
13310 |
},
|
13311 |
{
|
@@ -13452,9 +13452,9 @@
|
|
13452 |
"epoch": 92.0,
|
13453 |
"eval_accuracy": 0.9061371841155235,
|
13454 |
"eval_loss": 0.32391440868377686,
|
13455 |
-
"eval_runtime": 0.
|
13456 |
-
"eval_samples_per_second": 278
|
13457 |
-
"eval_steps_per_second":
|
13458 |
"step": 18032
|
13459 |
},
|
13460 |
{
|
@@ -13594,9 +13594,9 @@
|
|
13594 |
"epoch": 93.0,
|
13595 |
"eval_accuracy": 0.8989169675090253,
|
13596 |
"eval_loss": 0.4861180782318115,
|
13597 |
-
"eval_runtime": 0.
|
13598 |
-
"eval_samples_per_second":
|
13599 |
-
"eval_steps_per_second":
|
13600 |
"step": 18228
|
13601 |
},
|
13602 |
{
|
@@ -13743,9 +13743,9 @@
|
|
13743 |
"epoch": 94.0,
|
13744 |
"eval_accuracy": 0.8736462093862816,
|
13745 |
"eval_loss": 0.4443919062614441,
|
13746 |
-
"eval_runtime": 0.
|
13747 |
-
"eval_samples_per_second":
|
13748 |
-
"eval_steps_per_second": 37.
|
13749 |
"step": 18424
|
13750 |
},
|
13751 |
{
|
@@ -13892,9 +13892,9 @@
|
|
13892 |
"epoch": 95.0,
|
13893 |
"eval_accuracy": 0.8844765342960289,
|
13894 |
"eval_loss": 0.3712524473667145,
|
13895 |
-
"eval_runtime": 0.
|
13896 |
-
"eval_samples_per_second":
|
13897 |
-
"eval_steps_per_second": 37.
|
13898 |
"step": 18620
|
13899 |
},
|
13900 |
{
|
@@ -14034,9 +14034,9 @@
|
|
14034 |
"epoch": 96.0,
|
14035 |
"eval_accuracy": 0.8303249097472925,
|
14036 |
"eval_loss": 0.427941232919693,
|
14037 |
-
"eval_runtime":
|
14038 |
-
"eval_samples_per_second":
|
14039 |
-
"eval_steps_per_second":
|
14040 |
"step": 18816
|
14041 |
},
|
14042 |
{
|
@@ -14183,9 +14183,9 @@
|
|
14183 |
"epoch": 97.0,
|
14184 |
"eval_accuracy": 0.8411552346570397,
|
14185 |
"eval_loss": 0.6587985157966614,
|
14186 |
-
"eval_runtime": 0.
|
14187 |
-
"eval_samples_per_second":
|
14188 |
-
"eval_steps_per_second": 37.
|
14189 |
"step": 19012
|
14190 |
},
|
14191 |
{
|
@@ -14325,9 +14325,9 @@
|
|
14325 |
"epoch": 98.0,
|
14326 |
"eval_accuracy": 0.8267148014440433,
|
14327 |
"eval_loss": 0.66323322057724,
|
14328 |
-
"eval_runtime": 0.
|
14329 |
-
"eval_samples_per_second":
|
14330 |
-
"eval_steps_per_second": 37.
|
14331 |
"step": 19208
|
14332 |
},
|
14333 |
{
|
@@ -14474,9 +14474,9 @@
|
|
14474 |
"epoch": 99.0,
|
14475 |
"eval_accuracy": 0.8808664259927798,
|
14476 |
"eval_loss": 0.4641692638397217,
|
14477 |
-
"eval_runtime": 0.
|
14478 |
-
"eval_samples_per_second":
|
14479 |
-
"eval_steps_per_second": 37.
|
14480 |
"step": 19404
|
14481 |
},
|
14482 |
{
|
@@ -14623,9 +14623,9 @@
|
|
14623 |
"epoch": 100.0,
|
14624 |
"eval_accuracy": 0.8808664259927798,
|
14625 |
"eval_loss": 0.3624129593372345,
|
14626 |
-
"eval_runtime":
|
14627 |
-
"eval_samples_per_second":
|
14628 |
-
"eval_steps_per_second":
|
14629 |
"step": 19600
|
14630 |
},
|
14631 |
{
|
@@ -14633,9 +14633,9 @@
|
|
14633 |
"step": 19600,
|
14634 |
"total_flos": 5.678990728814592e+17,
|
14635 |
"train_loss": 0.30055975163317455,
|
14636 |
-
"train_runtime":
|
14637 |
-
"train_samples_per_second":
|
14638 |
-
"train_steps_per_second": 20.
|
14639 |
}
|
14640 |
],
|
14641 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": 0.26566287875175476,
|
3 |
+
"best_model_checkpoint": "./cocoa_outputs_resnet/checkpoint-6468",
|
4 |
"epoch": 100.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 19600,
|
|
|
145 |
"epoch": 1.0,
|
146 |
"eval_accuracy": 0.5595667870036101,
|
147 |
"eval_loss": 1.5222723484039307,
|
148 |
+
"eval_runtime": 0.9569,
|
149 |
+
"eval_samples_per_second": 289.486,
|
150 |
+
"eval_steps_per_second": 36.578,
|
151 |
"step": 196
|
152 |
},
|
153 |
{
|
|
|
294 |
"epoch": 2.0,
|
295 |
"eval_accuracy": 0.8303249097472925,
|
296 |
"eval_loss": 0.8974758386611938,
|
297 |
+
"eval_runtime": 0.934,
|
298 |
+
"eval_samples_per_second": 296.569,
|
299 |
+
"eval_steps_per_second": 37.473,
|
300 |
"step": 392
|
301 |
},
|
302 |
{
|
|
|
436 |
"epoch": 3.0,
|
437 |
"eval_accuracy": 0.8772563176895307,
|
438 |
"eval_loss": 0.6563544273376465,
|
439 |
+
"eval_runtime": 0.936,
|
440 |
+
"eval_samples_per_second": 295.927,
|
441 |
+
"eval_steps_per_second": 37.391,
|
442 |
"step": 588
|
443 |
},
|
444 |
{
|
|
|
585 |
"epoch": 4.0,
|
586 |
"eval_accuracy": 0.8339350180505415,
|
587 |
"eval_loss": 0.6841569542884827,
|
588 |
+
"eval_runtime": 0.9273,
|
589 |
+
"eval_samples_per_second": 298.728,
|
590 |
+
"eval_steps_per_second": 37.745,
|
591 |
"step": 784
|
592 |
},
|
593 |
{
|
|
|
734 |
"epoch": 5.0,
|
735 |
"eval_accuracy": 0.8808664259927798,
|
736 |
"eval_loss": 0.48941850662231445,
|
737 |
+
"eval_runtime": 0.935,
|
738 |
+
"eval_samples_per_second": 296.252,
|
739 |
+
"eval_steps_per_second": 37.433,
|
740 |
"step": 980
|
741 |
},
|
742 |
{
|
|
|
876 |
"epoch": 6.0,
|
877 |
"eval_accuracy": 0.8736462093862816,
|
878 |
"eval_loss": 0.41603580117225647,
|
879 |
+
"eval_runtime": 0.9296,
|
880 |
+
"eval_samples_per_second": 297.99,
|
881 |
+
"eval_steps_per_second": 37.652,
|
882 |
"step": 1176
|
883 |
},
|
884 |
{
|
|
|
1025 |
"epoch": 7.0,
|
1026 |
"eval_accuracy": 0.8844765342960289,
|
1027 |
"eval_loss": 0.40221381187438965,
|
1028 |
+
"eval_runtime": 0.9298,
|
1029 |
+
"eval_samples_per_second": 297.902,
|
1030 |
+
"eval_steps_per_second": 37.641,
|
1031 |
"step": 1372
|
1032 |
},
|
1033 |
{
|
|
|
1167 |
"epoch": 8.0,
|
1168 |
"eval_accuracy": 0.8411552346570397,
|
1169 |
"eval_loss": 0.4939042627811432,
|
1170 |
+
"eval_runtime": 0.9311,
|
1171 |
+
"eval_samples_per_second": 297.494,
|
1172 |
+
"eval_steps_per_second": 37.589,
|
1173 |
"step": 1568
|
1174 |
},
|
1175 |
{
|
|
|
1316 |
"epoch": 9.0,
|
1317 |
"eval_accuracy": 0.8772563176895307,
|
1318 |
"eval_loss": 0.35403916239738464,
|
1319 |
+
"eval_runtime": 0.9315,
|
1320 |
+
"eval_samples_per_second": 297.362,
|
1321 |
+
"eval_steps_per_second": 37.573,
|
1322 |
"step": 1764
|
1323 |
},
|
1324 |
{
|
|
|
1465 |
"epoch": 10.0,
|
1466 |
"eval_accuracy": 0.8953068592057761,
|
1467 |
"eval_loss": 0.349290668964386,
|
1468 |
+
"eval_runtime": 0.9365,
|
1469 |
+
"eval_samples_per_second": 295.793,
|
1470 |
+
"eval_steps_per_second": 37.375,
|
1471 |
"step": 1960
|
1472 |
},
|
1473 |
{
|
|
|
1607 |
"epoch": 11.0,
|
1608 |
"eval_accuracy": 0.776173285198556,
|
1609 |
"eval_loss": 0.7928438186645508,
|
1610 |
+
"eval_runtime": 0.9321,
|
1611 |
+
"eval_samples_per_second": 297.189,
|
1612 |
+
"eval_steps_per_second": 37.551,
|
1613 |
"step": 2156
|
1614 |
},
|
1615 |
{
|
|
|
1756 |
"epoch": 12.0,
|
1757 |
"eval_accuracy": 0.296028880866426,
|
1758 |
"eval_loss": 2.06593918800354,
|
1759 |
+
"eval_runtime": 0.9947,
|
1760 |
+
"eval_samples_per_second": 278.482,
|
1761 |
+
"eval_steps_per_second": 35.187,
|
1762 |
"step": 2352
|
1763 |
},
|
1764 |
{
|
|
|
1898 |
"epoch": 13.0,
|
1899 |
"eval_accuracy": 0.851985559566787,
|
1900 |
"eval_loss": 0.44439464807510376,
|
1901 |
+
"eval_runtime": 0.9289,
|
1902 |
+
"eval_samples_per_second": 298.212,
|
1903 |
+
"eval_steps_per_second": 37.68,
|
1904 |
"step": 2548
|
1905 |
},
|
1906 |
{
|
|
|
2047 |
"epoch": 14.0,
|
2048 |
"eval_accuracy": 0.8736462093862816,
|
2049 |
"eval_loss": 0.46400919556617737,
|
2050 |
+
"eval_runtime": 0.9937,
|
2051 |
+
"eval_samples_per_second": 278.754,
|
2052 |
+
"eval_steps_per_second": 35.222,
|
2053 |
"step": 2744
|
2054 |
},
|
2055 |
{
|
|
|
2196 |
"epoch": 15.0,
|
2197 |
"eval_accuracy": 0.8772563176895307,
|
2198 |
"eval_loss": 0.37753719091415405,
|
2199 |
+
"eval_runtime": 0.9317,
|
2200 |
+
"eval_samples_per_second": 297.316,
|
2201 |
+
"eval_steps_per_second": 37.567,
|
2202 |
"step": 2940
|
2203 |
},
|
2204 |
{
|
|
|
2338 |
"epoch": 16.0,
|
2339 |
"eval_accuracy": 0.8880866425992779,
|
2340 |
"eval_loss": 0.3519056737422943,
|
2341 |
+
"eval_runtime": 0.9334,
|
2342 |
+
"eval_samples_per_second": 296.766,
|
2343 |
+
"eval_steps_per_second": 37.498,
|
2344 |
"step": 3136
|
2345 |
},
|
2346 |
{
|
|
|
2487 |
"epoch": 17.0,
|
2488 |
"eval_accuracy": 0.9061371841155235,
|
2489 |
"eval_loss": 0.33103030920028687,
|
2490 |
+
"eval_runtime": 0.9376,
|
2491 |
+
"eval_samples_per_second": 295.446,
|
2492 |
+
"eval_steps_per_second": 37.331,
|
2493 |
"step": 3332
|
2494 |
},
|
2495 |
{
|
|
|
2629 |
"epoch": 18.0,
|
2630 |
"eval_accuracy": 0.8916967509025271,
|
2631 |
"eval_loss": 0.34751203656196594,
|
2632 |
+
"eval_runtime": 0.9366,
|
2633 |
+
"eval_samples_per_second": 295.765,
|
2634 |
+
"eval_steps_per_second": 37.371,
|
2635 |
"step": 3528
|
2636 |
},
|
2637 |
{
|
|
|
2778 |
"epoch": 19.0,
|
2779 |
"eval_accuracy": 0.8592057761732852,
|
2780 |
"eval_loss": 0.38391339778900146,
|
2781 |
+
"eval_runtime": 0.9352,
|
2782 |
+
"eval_samples_per_second": 296.2,
|
2783 |
+
"eval_steps_per_second": 37.426,
|
2784 |
"step": 3724
|
2785 |
},
|
2786 |
{
|
|
|
2927 |
"epoch": 20.0,
|
2928 |
"eval_accuracy": 0.9133574007220217,
|
2929 |
"eval_loss": 0.3031846880912781,
|
2930 |
+
"eval_runtime": 0.9346,
|
2931 |
+
"eval_samples_per_second": 296.374,
|
2932 |
+
"eval_steps_per_second": 37.448,
|
2933 |
"step": 3920
|
2934 |
},
|
2935 |
{
|
|
|
3069 |
"epoch": 21.0,
|
3070 |
"eval_accuracy": 0.851985559566787,
|
3071 |
"eval_loss": 0.4246116876602173,
|
3072 |
+
"eval_runtime": 0.9314,
|
3073 |
+
"eval_samples_per_second": 297.413,
|
3074 |
+
"eval_steps_per_second": 37.579,
|
3075 |
"step": 4116
|
3076 |
},
|
3077 |
{
|
|
|
3218 |
"epoch": 22.0,
|
3219 |
"eval_accuracy": 0.8989169675090253,
|
3220 |
"eval_loss": 0.29509276151657104,
|
3221 |
+
"eval_runtime": 0.9307,
|
3222 |
+
"eval_samples_per_second": 297.612,
|
3223 |
+
"eval_steps_per_second": 37.604,
|
3224 |
"step": 4312
|
3225 |
},
|
3226 |
{
|
|
|
3360 |
"epoch": 23.0,
|
3361 |
"eval_accuracy": 0.851985559566787,
|
3362 |
"eval_loss": 0.4356595277786255,
|
3363 |
+
"eval_runtime": 0.9603,
|
3364 |
+
"eval_samples_per_second": 288.437,
|
3365 |
+
"eval_steps_per_second": 36.445,
|
3366 |
"step": 4508
|
3367 |
},
|
3368 |
{
|
|
|
3509 |
"epoch": 24.0,
|
3510 |
"eval_accuracy": 0.8916967509025271,
|
3511 |
"eval_loss": 0.399036169052124,
|
3512 |
+
"eval_runtime": 0.9342,
|
3513 |
+
"eval_samples_per_second": 296.5,
|
3514 |
+
"eval_steps_per_second": 37.464,
|
3515 |
"step": 4704
|
3516 |
},
|
3517 |
{
|
|
|
3658 |
"epoch": 25.0,
|
3659 |
"eval_accuracy": 0.9097472924187726,
|
3660 |
"eval_loss": 0.35359257459640503,
|
3661 |
+
"eval_runtime": 0.9646,
|
3662 |
+
"eval_samples_per_second": 287.175,
|
3663 |
+
"eval_steps_per_second": 36.286,
|
3664 |
"step": 4900
|
3665 |
},
|
3666 |
{
|
|
|
3800 |
"epoch": 26.0,
|
3801 |
"eval_accuracy": 0.8592057761732852,
|
3802 |
"eval_loss": 0.4166140854358673,
|
3803 |
+
"eval_runtime": 0.9729,
|
3804 |
+
"eval_samples_per_second": 284.728,
|
3805 |
+
"eval_steps_per_second": 35.976,
|
3806 |
"step": 5096
|
3807 |
},
|
3808 |
{
|
|
|
3949 |
"epoch": 27.0,
|
3950 |
"eval_accuracy": 0.851985559566787,
|
3951 |
"eval_loss": 0.4353993237018585,
|
3952 |
+
"eval_runtime": 0.9398,
|
3953 |
+
"eval_samples_per_second": 294.757,
|
3954 |
+
"eval_steps_per_second": 37.244,
|
3955 |
"step": 5292
|
3956 |
},
|
3957 |
{
|
|
|
4091 |
"epoch": 28.0,
|
4092 |
"eval_accuracy": 0.8592057761732852,
|
4093 |
"eval_loss": 0.4088672697544098,
|
4094 |
+
"eval_runtime": 0.9406,
|
4095 |
+
"eval_samples_per_second": 294.489,
|
4096 |
+
"eval_steps_per_second": 37.21,
|
4097 |
"step": 5488
|
4098 |
},
|
4099 |
{
|
|
|
4240 |
"epoch": 29.0,
|
4241 |
"eval_accuracy": 0.8231046931407943,
|
4242 |
"eval_loss": 0.4787161946296692,
|
4243 |
+
"eval_runtime": 0.933,
|
4244 |
+
"eval_samples_per_second": 296.9,
|
4245 |
+
"eval_steps_per_second": 37.514,
|
4246 |
"step": 5684
|
4247 |
},
|
4248 |
{
|
|
|
4389 |
"epoch": 30.0,
|
4390 |
"eval_accuracy": 0.9097472924187726,
|
4391 |
"eval_loss": 0.3165305256843567,
|
4392 |
+
"eval_runtime": 0.9292,
|
4393 |
+
"eval_samples_per_second": 298.12,
|
4394 |
+
"eval_steps_per_second": 37.669,
|
4395 |
"step": 5880
|
4396 |
},
|
4397 |
{
|
|
|
4531 |
"epoch": 31.0,
|
4532 |
"eval_accuracy": 0.9133574007220217,
|
4533 |
"eval_loss": 0.31053850054740906,
|
4534 |
+
"eval_runtime": 0.9345,
|
4535 |
+
"eval_samples_per_second": 296.427,
|
4536 |
+
"eval_steps_per_second": 37.455,
|
4537 |
"step": 6076
|
4538 |
},
|
4539 |
{
|
|
|
4680 |
"epoch": 32.0,
|
4681 |
"eval_accuracy": 0.9061371841155235,
|
4682 |
"eval_loss": 0.3559906780719757,
|
4683 |
+
"eval_runtime": 0.9353,
|
4684 |
+
"eval_samples_per_second": 296.174,
|
4685 |
+
"eval_steps_per_second": 37.423,
|
4686 |
"step": 6272
|
4687 |
},
|
4688 |
{
|
|
|
4822 |
"epoch": 33.0,
|
4823 |
"eval_accuracy": 0.9097472924187726,
|
4824 |
"eval_loss": 0.26566287875175476,
|
4825 |
+
"eval_runtime": 0.9334,
|
4826 |
+
"eval_samples_per_second": 296.762,
|
4827 |
+
"eval_steps_per_second": 37.497,
|
4828 |
"step": 6468
|
4829 |
},
|
4830 |
{
|
|
|
4971 |
"epoch": 34.0,
|
4972 |
"eval_accuracy": 0.9133574007220217,
|
4973 |
"eval_loss": 0.2679595947265625,
|
4974 |
+
"eval_runtime": 0.936,
|
4975 |
+
"eval_samples_per_second": 295.944,
|
4976 |
+
"eval_steps_per_second": 37.394,
|
4977 |
"step": 6664
|
4978 |
},
|
4979 |
{
|
|
|
5120 |
"epoch": 35.0,
|
5121 |
"eval_accuracy": 0.9061371841155235,
|
5122 |
"eval_loss": 0.3797638416290283,
|
5123 |
+
"eval_runtime": 0.9298,
|
5124 |
+
"eval_samples_per_second": 297.901,
|
5125 |
+
"eval_steps_per_second": 37.641,
|
5126 |
"step": 6860
|
5127 |
},
|
5128 |
{
|
|
|
5262 |
"epoch": 36.0,
|
5263 |
"eval_accuracy": 0.855595667870036,
|
5264 |
"eval_loss": 0.5098311305046082,
|
5265 |
+
"eval_runtime": 0.9428,
|
5266 |
+
"eval_samples_per_second": 293.818,
|
5267 |
+
"eval_steps_per_second": 37.125,
|
5268 |
"step": 7056
|
5269 |
},
|
5270 |
{
|
|
|
5411 |
"epoch": 37.0,
|
5412 |
"eval_accuracy": 0.8808664259927798,
|
5413 |
"eval_loss": 0.42190420627593994,
|
5414 |
+
"eval_runtime": 0.9304,
|
5415 |
+
"eval_samples_per_second": 297.732,
|
5416 |
+
"eval_steps_per_second": 37.62,
|
5417 |
"step": 7252
|
5418 |
},
|
5419 |
{
|
|
|
5553 |
"epoch": 38.0,
|
5554 |
"eval_accuracy": 0.9133574007220217,
|
5555 |
"eval_loss": 0.2851579189300537,
|
5556 |
+
"eval_runtime": 0.9753,
|
5557 |
+
"eval_samples_per_second": 284.019,
|
5558 |
+
"eval_steps_per_second": 35.887,
|
5559 |
"step": 7448
|
5560 |
},
|
5561 |
{
|
|
|
5702 |
"epoch": 39.0,
|
5703 |
"eval_accuracy": 0.8989169675090253,
|
5704 |
"eval_loss": 0.36030298471450806,
|
5705 |
+
"eval_runtime": 0.9403,
|
5706 |
+
"eval_samples_per_second": 294.598,
|
5707 |
+
"eval_steps_per_second": 37.224,
|
5708 |
"step": 7644
|
5709 |
},
|
5710 |
{
|
|
|
5851 |
"epoch": 40.0,
|
5852 |
"eval_accuracy": 0.8736462093862816,
|
5853 |
"eval_loss": 0.351894736289978,
|
5854 |
+
"eval_runtime": 0.9415,
|
5855 |
+
"eval_samples_per_second": 294.212,
|
5856 |
+
"eval_steps_per_second": 37.175,
|
5857 |
"step": 7840
|
5858 |
},
|
5859 |
{
|
|
|
5993 |
"epoch": 41.0,
|
5994 |
"eval_accuracy": 0.9025270758122743,
|
5995 |
"eval_loss": 0.3343473970890045,
|
5996 |
+
"eval_runtime": 0.9379,
|
5997 |
+
"eval_samples_per_second": 295.341,
|
5998 |
+
"eval_steps_per_second": 37.317,
|
5999 |
"step": 8036
|
6000 |
},
|
6001 |
{
|
|
|
6142 |
"epoch": 42.0,
|
6143 |
"eval_accuracy": 0.9169675090252708,
|
6144 |
"eval_loss": 0.3383941352367401,
|
6145 |
+
"eval_runtime": 0.9348,
|
6146 |
+
"eval_samples_per_second": 296.313,
|
6147 |
+
"eval_steps_per_second": 37.44,
|
6148 |
"step": 8232
|
6149 |
},
|
6150 |
{
|
|
|
6284 |
"epoch": 43.0,
|
6285 |
"eval_accuracy": 0.8772563176895307,
|
6286 |
"eval_loss": 0.40458711981773376,
|
6287 |
+
"eval_runtime": 0.9383,
|
6288 |
+
"eval_samples_per_second": 295.207,
|
6289 |
+
"eval_steps_per_second": 37.301,
|
6290 |
"step": 8428
|
6291 |
},
|
6292 |
{
|
|
|
6433 |
"epoch": 44.0,
|
6434 |
"eval_accuracy": 0.8916967509025271,
|
6435 |
"eval_loss": 0.39525121450424194,
|
6436 |
+
"eval_runtime": 0.9341,
|
6437 |
+
"eval_samples_per_second": 296.557,
|
6438 |
+
"eval_steps_per_second": 37.471,
|
6439 |
"step": 8624
|
6440 |
},
|
6441 |
{
|
|
|
6582 |
"epoch": 45.0,
|
6583 |
"eval_accuracy": 0.8592057761732852,
|
6584 |
"eval_loss": 0.5002943873405457,
|
6585 |
+
"eval_runtime": 0.9313,
|
6586 |
+
"eval_samples_per_second": 297.43,
|
6587 |
+
"eval_steps_per_second": 37.581,
|
6588 |
"step": 8820
|
6589 |
},
|
6590 |
{
|
|
|
6724 |
"epoch": 46.0,
|
6725 |
"eval_accuracy": 0.9169675090252708,
|
6726 |
"eval_loss": 0.3231888711452484,
|
6727 |
+
"eval_runtime": 0.9353,
|
6728 |
+
"eval_samples_per_second": 296.162,
|
6729 |
+
"eval_steps_per_second": 37.421,
|
6730 |
"step": 9016
|
6731 |
},
|
6732 |
{
|
|
|
6873 |
"epoch": 47.0,
|
6874 |
"eval_accuracy": 0.9169675090252708,
|
6875 |
"eval_loss": 0.3112559914588928,
|
6876 |
+
"eval_runtime": 0.9287,
|
6877 |
+
"eval_samples_per_second": 298.262,
|
6878 |
+
"eval_steps_per_second": 37.687,
|
6879 |
"step": 9212
|
6880 |
},
|
6881 |
{
|
|
|
7015 |
"epoch": 48.0,
|
7016 |
"eval_accuracy": 0.855595667870036,
|
7017 |
"eval_loss": 0.4494384229183197,
|
7018 |
+
"eval_runtime": 0.928,
|
7019 |
+
"eval_samples_per_second": 298.494,
|
7020 |
+
"eval_steps_per_second": 37.716,
|
7021 |
"step": 9408
|
7022 |
},
|
7023 |
{
|
|
|
7164 |
"epoch": 49.0,
|
7165 |
"eval_accuracy": 0.9205776173285198,
|
7166 |
"eval_loss": 0.37217509746551514,
|
7167 |
+
"eval_runtime": 0.9297,
|
7168 |
+
"eval_samples_per_second": 297.952,
|
7169 |
+
"eval_steps_per_second": 37.647,
|
7170 |
"step": 9604
|
7171 |
},
|
7172 |
{
|
|
|
7313 |
"epoch": 50.0,
|
7314 |
"eval_accuracy": 0.9097472924187726,
|
7315 |
"eval_loss": 0.2852139472961426,
|
7316 |
+
"eval_runtime": 0.9306,
|
7317 |
+
"eval_samples_per_second": 297.668,
|
7318 |
+
"eval_steps_per_second": 37.611,
|
7319 |
"step": 9800
|
7320 |
},
|
7321 |
{
|
|
|
7455 |
"epoch": 51.0,
|
7456 |
"eval_accuracy": 0.8628158844765343,
|
7457 |
"eval_loss": 0.4137951135635376,
|
7458 |
+
"eval_runtime": 0.9371,
|
7459 |
+
"eval_samples_per_second": 295.604,
|
7460 |
+
"eval_steps_per_second": 37.351,
|
7461 |
"step": 9996
|
7462 |
},
|
7463 |
{
|
|
|
7604 |
"epoch": 52.0,
|
7605 |
"eval_accuracy": 0.8953068592057761,
|
7606 |
"eval_loss": 0.34130236506462097,
|
7607 |
+
"eval_runtime": 0.9387,
|
7608 |
+
"eval_samples_per_second": 295.092,
|
7609 |
+
"eval_steps_per_second": 37.286,
|
7610 |
"step": 10192
|
7611 |
},
|
7612 |
{
|
|
|
7746 |
"epoch": 53.0,
|
7747 |
"eval_accuracy": 0.9169675090252708,
|
7748 |
"eval_loss": 0.30462250113487244,
|
7749 |
+
"eval_runtime": 0.9357,
|
7750 |
+
"eval_samples_per_second": 296.019,
|
7751 |
+
"eval_steps_per_second": 37.403,
|
7752 |
"step": 10388
|
7753 |
},
|
7754 |
{
|
|
|
7895 |
"epoch": 54.0,
|
7896 |
"eval_accuracy": 0.8989169675090253,
|
7897 |
"eval_loss": 0.2849152684211731,
|
7898 |
+
"eval_runtime": 0.9334,
|
7899 |
+
"eval_samples_per_second": 296.775,
|
7900 |
+
"eval_steps_per_second": 37.499,
|
7901 |
"step": 10584
|
7902 |
},
|
7903 |
{
|
|
|
8044 |
"epoch": 55.0,
|
8045 |
"eval_accuracy": 0.9133574007220217,
|
8046 |
"eval_loss": 0.35168057680130005,
|
8047 |
+
"eval_runtime": 0.9361,
|
8048 |
+
"eval_samples_per_second": 295.907,
|
8049 |
+
"eval_steps_per_second": 37.389,
|
8050 |
"step": 10780
|
8051 |
},
|
8052 |
{
|
|
|
8186 |
"epoch": 56.0,
|
8187 |
"eval_accuracy": 0.9025270758122743,
|
8188 |
"eval_loss": 0.45381447672843933,
|
8189 |
+
"eval_runtime": 0.9344,
|
8190 |
+
"eval_samples_per_second": 296.45,
|
8191 |
+
"eval_steps_per_second": 37.458,
|
8192 |
"step": 10976
|
8193 |
},
|
8194 |
{
|
|
|
8335 |
"epoch": 57.0,
|
8336 |
"eval_accuracy": 0.8592057761732852,
|
8337 |
"eval_loss": 0.44916799664497375,
|
8338 |
+
"eval_runtime": 0.9373,
|
8339 |
+
"eval_samples_per_second": 295.53,
|
8340 |
+
"eval_steps_per_second": 37.341,
|
8341 |
"step": 11172
|
8342 |
},
|
8343 |
{
|
|
|
8477 |
"epoch": 58.0,
|
8478 |
"eval_accuracy": 0.8628158844765343,
|
8479 |
"eval_loss": 0.4738902747631073,
|
8480 |
+
"eval_runtime": 0.9332,
|
8481 |
+
"eval_samples_per_second": 296.824,
|
8482 |
+
"eval_steps_per_second": 37.505,
|
8483 |
"step": 11368
|
8484 |
},
|
8485 |
{
|
|
|
8626 |
"epoch": 59.0,
|
8627 |
"eval_accuracy": 0.9205776173285198,
|
8628 |
"eval_loss": 0.2831103205680847,
|
8629 |
+
"eval_runtime": 0.9316,
|
8630 |
+
"eval_samples_per_second": 297.324,
|
8631 |
+
"eval_steps_per_second": 37.568,
|
8632 |
"step": 11564
|
8633 |
},
|
8634 |
{
|
|
|
8775 |
"epoch": 60.0,
|
8776 |
"eval_accuracy": 0.9205776173285198,
|
8777 |
"eval_loss": 0.34654152393341064,
|
8778 |
+
"eval_runtime": 0.9298,
|
8779 |
+
"eval_samples_per_second": 297.899,
|
8780 |
+
"eval_steps_per_second": 37.641,
|
8781 |
"step": 11760
|
8782 |
},
|
8783 |
{
|
|
|
8917 |
"epoch": 61.0,
|
8918 |
"eval_accuracy": 0.9314079422382672,
|
8919 |
"eval_loss": 0.28843551874160767,
|
8920 |
+
"eval_runtime": 0.938,
|
8921 |
+
"eval_samples_per_second": 295.31,
|
8922 |
+
"eval_steps_per_second": 37.314,
|
8923 |
"step": 11956
|
8924 |
},
|
8925 |
{
|
|
|
9066 |
"epoch": 62.0,
|
9067 |
"eval_accuracy": 0.8447653429602888,
|
9068 |
"eval_loss": 0.4874745309352875,
|
9069 |
+
"eval_runtime": 0.935,
|
9070 |
+
"eval_samples_per_second": 296.251,
|
9071 |
+
"eval_steps_per_second": 37.432,
|
9072 |
"step": 12152
|
9073 |
},
|
9074 |
{
|
|
|
9208 |
"epoch": 63.0,
|
9209 |
"eval_accuracy": 0.9061371841155235,
|
9210 |
"eval_loss": 0.3988655209541321,
|
9211 |
+
"eval_runtime": 0.9339,
|
9212 |
+
"eval_samples_per_second": 296.617,
|
9213 |
+
"eval_steps_per_second": 37.479,
|
9214 |
"step": 12348
|
9215 |
},
|
9216 |
{
|
|
|
9357 |
"epoch": 64.0,
|
9358 |
"eval_accuracy": 0.851985559566787,
|
9359 |
"eval_loss": 0.5952923893928528,
|
9360 |
+
"eval_runtime": 0.9334,
|
9361 |
+
"eval_samples_per_second": 296.767,
|
9362 |
+
"eval_steps_per_second": 37.498,
|
9363 |
"step": 12544
|
9364 |
},
|
9365 |
{
|
|
|
9506 |
"epoch": 65.0,
|
9507 |
"eval_accuracy": 0.927797833935018,
|
9508 |
"eval_loss": 0.2953914701938629,
|
9509 |
+
"eval_runtime": 0.9948,
|
9510 |
+
"eval_samples_per_second": 278.444,
|
9511 |
+
"eval_steps_per_second": 35.183,
|
9512 |
"step": 12740
|
9513 |
},
|
9514 |
{
|
|
|
9648 |
"epoch": 66.0,
|
9649 |
"eval_accuracy": 0.851985559566787,
|
9650 |
"eval_loss": 0.5033073425292969,
|
9651 |
+
"eval_runtime": 0.9324,
|
9652 |
+
"eval_samples_per_second": 297.09,
|
9653 |
+
"eval_steps_per_second": 37.538,
|
9654 |
"step": 12936
|
9655 |
},
|
9656 |
{
|
|
|
9797 |
"epoch": 67.0,
|
9798 |
"eval_accuracy": 0.8808664259927798,
|
9799 |
"eval_loss": 0.41321179270744324,
|
9800 |
+
"eval_runtime": 0.9337,
|
9801 |
+
"eval_samples_per_second": 296.681,
|
9802 |
+
"eval_steps_per_second": 37.487,
|
9803 |
"step": 13132
|
9804 |
},
|
9805 |
{
|
|
|
9939 |
"epoch": 68.0,
|
9940 |
"eval_accuracy": 0.9169675090252708,
|
9941 |
"eval_loss": 0.37430626153945923,
|
9942 |
+
"eval_runtime": 0.9326,
|
9943 |
+
"eval_samples_per_second": 297.033,
|
9944 |
+
"eval_steps_per_second": 37.531,
|
9945 |
"step": 13328
|
9946 |
},
|
9947 |
{
|
|
|
10088 |
"epoch": 69.0,
|
10089 |
"eval_accuracy": 0.776173285198556,
|
10090 |
"eval_loss": 0.6423271298408508,
|
10091 |
+
"eval_runtime": 0.9344,
|
10092 |
+
"eval_samples_per_second": 296.457,
|
10093 |
+
"eval_steps_per_second": 37.458,
|
10094 |
"step": 13524
|
10095 |
},
|
10096 |
{
|
|
|
10237 |
"epoch": 70.0,
|
10238 |
"eval_accuracy": 0.8014440433212996,
|
10239 |
"eval_loss": 0.5979345440864563,
|
10240 |
+
"eval_runtime": 0.9413,
|
10241 |
+
"eval_samples_per_second": 294.271,
|
10242 |
+
"eval_steps_per_second": 37.182,
|
10243 |
"step": 13720
|
10244 |
},
|
10245 |
{
|
|
|
10379 |
"epoch": 71.0,
|
10380 |
"eval_accuracy": 0.8989169675090253,
|
10381 |
"eval_loss": 0.43981537222862244,
|
10382 |
+
"eval_runtime": 0.9369,
|
10383 |
+
"eval_samples_per_second": 295.663,
|
10384 |
+
"eval_steps_per_second": 37.358,
|
10385 |
"step": 13916
|
10386 |
},
|
10387 |
{
|
|
|
10528 |
"epoch": 72.0,
|
10529 |
"eval_accuracy": 0.8231046931407943,
|
10530 |
"eval_loss": 0.5633912086486816,
|
10531 |
+
"eval_runtime": 0.9331,
|
10532 |
+
"eval_samples_per_second": 296.846,
|
10533 |
+
"eval_steps_per_second": 37.508,
|
10534 |
"step": 14112
|
10535 |
},
|
10536 |
{
|
|
|
10670 |
"epoch": 73.0,
|
10671 |
"eval_accuracy": 0.776173285198556,
|
10672 |
"eval_loss": 0.620398223400116,
|
10673 |
+
"eval_runtime": 0.9369,
|
10674 |
+
"eval_samples_per_second": 295.645,
|
10675 |
+
"eval_steps_per_second": 37.356,
|
10676 |
"step": 14308
|
10677 |
},
|
10678 |
{
|
|
|
10819 |
"epoch": 74.0,
|
10820 |
"eval_accuracy": 0.8953068592057761,
|
10821 |
"eval_loss": 0.36853671073913574,
|
10822 |
+
"eval_runtime": 0.9373,
|
10823 |
+
"eval_samples_per_second": 295.515,
|
10824 |
+
"eval_steps_per_second": 37.339,
|
10825 |
"step": 14504
|
10826 |
},
|
10827 |
{
|
|
|
10968 |
"epoch": 75.0,
|
10969 |
"eval_accuracy": 0.8158844765342961,
|
10970 |
"eval_loss": 0.7026161551475525,
|
10971 |
+
"eval_runtime": 0.9279,
|
10972 |
+
"eval_samples_per_second": 298.519,
|
10973 |
+
"eval_steps_per_second": 37.719,
|
10974 |
"step": 14700
|
10975 |
},
|
10976 |
{
|
|
|
11110 |
"epoch": 76.0,
|
11111 |
"eval_accuracy": 0.9169675090252708,
|
11112 |
"eval_loss": 0.40481600165367126,
|
11113 |
+
"eval_runtime": 0.9401,
|
11114 |
+
"eval_samples_per_second": 294.635,
|
11115 |
+
"eval_steps_per_second": 37.228,
|
11116 |
"step": 14896
|
11117 |
},
|
11118 |
{
|
|
|
11259 |
"epoch": 77.0,
|
11260 |
"eval_accuracy": 0.8844765342960289,
|
11261 |
"eval_loss": 0.48912858963012695,
|
11262 |
+
"eval_runtime": 0.9257,
|
11263 |
+
"eval_samples_per_second": 299.23,
|
11264 |
+
"eval_steps_per_second": 37.809,
|
11265 |
"step": 15092
|
11266 |
},
|
11267 |
{
|
|
|
11401 |
"epoch": 78.0,
|
11402 |
"eval_accuracy": 0.8772563176895307,
|
11403 |
"eval_loss": 0.42159637808799744,
|
11404 |
+
"eval_runtime": 0.9931,
|
11405 |
+
"eval_samples_per_second": 278.916,
|
11406 |
+
"eval_steps_per_second": 35.242,
|
11407 |
"step": 15288
|
11408 |
},
|
11409 |
{
|
|
|
11550 |
"epoch": 79.0,
|
11551 |
"eval_accuracy": 0.8953068592057761,
|
11552 |
"eval_loss": 0.2720978558063507,
|
11553 |
+
"eval_runtime": 0.9347,
|
11554 |
+
"eval_samples_per_second": 296.358,
|
11555 |
+
"eval_steps_per_second": 37.446,
|
11556 |
"step": 15484
|
11557 |
},
|
11558 |
{
|
|
|
11699 |
"epoch": 80.0,
|
11700 |
"eval_accuracy": 0.8483754512635379,
|
11701 |
"eval_loss": 0.42701977491378784,
|
11702 |
+
"eval_runtime": 0.9306,
|
11703 |
+
"eval_samples_per_second": 297.657,
|
11704 |
+
"eval_steps_per_second": 37.61,
|
11705 |
"step": 15680
|
11706 |
},
|
11707 |
{
|
|
|
11841 |
"epoch": 81.0,
|
11842 |
"eval_accuracy": 0.7833935018050542,
|
11843 |
"eval_loss": 0.763225793838501,
|
11844 |
+
"eval_runtime": 0.9357,
|
11845 |
+
"eval_samples_per_second": 296.038,
|
11846 |
+
"eval_steps_per_second": 37.405,
|
11847 |
"step": 15876
|
11848 |
},
|
11849 |
{
|
|
|
11990 |
"epoch": 82.0,
|
11991 |
"eval_accuracy": 0.9025270758122743,
|
11992 |
"eval_loss": 0.3249270021915436,
|
11993 |
+
"eval_runtime": 0.9334,
|
11994 |
+
"eval_samples_per_second": 296.754,
|
11995 |
+
"eval_steps_per_second": 37.496,
|
11996 |
"step": 16072
|
11997 |
},
|
11998 |
{
|
|
|
12132 |
"epoch": 83.0,
|
12133 |
"eval_accuracy": 0.8989169675090253,
|
12134 |
"eval_loss": 0.38384127616882324,
|
12135 |
+
"eval_runtime": 0.9338,
|
12136 |
+
"eval_samples_per_second": 296.64,
|
12137 |
+
"eval_steps_per_second": 37.482,
|
12138 |
"step": 16268
|
12139 |
},
|
12140 |
{
|
|
|
12281 |
"epoch": 84.0,
|
12282 |
"eval_accuracy": 0.9205776173285198,
|
12283 |
"eval_loss": 0.3329784572124481,
|
12284 |
+
"eval_runtime": 0.9338,
|
12285 |
+
"eval_samples_per_second": 296.638,
|
12286 |
+
"eval_steps_per_second": 37.481,
|
12287 |
"step": 16464
|
12288 |
},
|
12289 |
{
|
|
|
12430 |
"epoch": 85.0,
|
12431 |
"eval_accuracy": 0.8700361010830325,
|
12432 |
"eval_loss": 0.32456666231155396,
|
12433 |
+
"eval_runtime": 0.9335,
|
12434 |
+
"eval_samples_per_second": 296.719,
|
12435 |
+
"eval_steps_per_second": 37.492,
|
12436 |
"step": 16660
|
12437 |
},
|
12438 |
{
|
|
|
12572 |
"epoch": 86.0,
|
12573 |
"eval_accuracy": 0.8736462093862816,
|
12574 |
"eval_loss": 0.3710058927536011,
|
12575 |
+
"eval_runtime": 0.9462,
|
12576 |
+
"eval_samples_per_second": 292.762,
|
12577 |
+
"eval_steps_per_second": 36.992,
|
12578 |
"step": 16856
|
12579 |
},
|
12580 |
{
|
|
|
12721 |
"epoch": 87.0,
|
12722 |
"eval_accuracy": 0.9061371841155235,
|
12723 |
"eval_loss": 0.33839184045791626,
|
12724 |
+
"eval_runtime": 0.9931,
|
12725 |
+
"eval_samples_per_second": 278.938,
|
12726 |
+
"eval_steps_per_second": 35.245,
|
12727 |
"step": 17052
|
12728 |
},
|
12729 |
{
|
|
|
12863 |
"epoch": 88.0,
|
12864 |
"eval_accuracy": 0.9097472924187726,
|
12865 |
"eval_loss": 0.3703186511993408,
|
12866 |
+
"eval_runtime": 0.9324,
|
12867 |
+
"eval_samples_per_second": 297.094,
|
12868 |
+
"eval_steps_per_second": 37.539,
|
12869 |
"step": 17248
|
12870 |
},
|
12871 |
{
|
|
|
13012 |
"epoch": 89.0,
|
13013 |
"eval_accuracy": 0.8592057761732852,
|
13014 |
"eval_loss": 0.5013492703437805,
|
13015 |
+
"eval_runtime": 0.9311,
|
13016 |
+
"eval_samples_per_second": 297.495,
|
13017 |
+
"eval_steps_per_second": 37.59,
|
13018 |
"step": 17444
|
13019 |
},
|
13020 |
{
|
|
|
13161 |
"epoch": 90.0,
|
13162 |
"eval_accuracy": 0.8989169675090253,
|
13163 |
"eval_loss": 0.3456423580646515,
|
13164 |
+
"eval_runtime": 0.9297,
|
13165 |
+
"eval_samples_per_second": 297.96,
|
13166 |
+
"eval_steps_per_second": 37.648,
|
13167 |
"step": 17640
|
13168 |
},
|
13169 |
{
|
|
|
13303 |
"epoch": 91.0,
|
13304 |
"eval_accuracy": 0.8880866425992779,
|
13305 |
"eval_loss": 0.3798539340496063,
|
13306 |
+
"eval_runtime": 0.9367,
|
13307 |
+
"eval_samples_per_second": 295.72,
|
13308 |
+
"eval_steps_per_second": 37.365,
|
13309 |
"step": 17836
|
13310 |
},
|
13311 |
{
|
|
|
13452 |
"epoch": 92.0,
|
13453 |
"eval_accuracy": 0.9061371841155235,
|
13454 |
"eval_loss": 0.32391440868377686,
|
13455 |
+
"eval_runtime": 0.9318,
|
13456 |
+
"eval_samples_per_second": 297.278,
|
13457 |
+
"eval_steps_per_second": 37.562,
|
13458 |
"step": 18032
|
13459 |
},
|
13460 |
{
|
|
|
13594 |
"epoch": 93.0,
|
13595 |
"eval_accuracy": 0.8989169675090253,
|
13596 |
"eval_loss": 0.4861180782318115,
|
13597 |
+
"eval_runtime": 0.9969,
|
13598 |
+
"eval_samples_per_second": 277.851,
|
13599 |
+
"eval_steps_per_second": 35.107,
|
13600 |
"step": 18228
|
13601 |
},
|
13602 |
{
|
|
|
13743 |
"epoch": 94.0,
|
13744 |
"eval_accuracy": 0.8736462093862816,
|
13745 |
"eval_loss": 0.4443919062614441,
|
13746 |
+
"eval_runtime": 0.9334,
|
13747 |
+
"eval_samples_per_second": 296.762,
|
13748 |
+
"eval_steps_per_second": 37.497,
|
13749 |
"step": 18424
|
13750 |
},
|
13751 |
{
|
|
|
13892 |
"epoch": 95.0,
|
13893 |
"eval_accuracy": 0.8844765342960289,
|
13894 |
"eval_loss": 0.3712524473667145,
|
13895 |
+
"eval_runtime": 0.9337,
|
13896 |
+
"eval_samples_per_second": 296.658,
|
13897 |
+
"eval_steps_per_second": 37.484,
|
13898 |
"step": 18620
|
13899 |
},
|
13900 |
{
|
|
|
14034 |
"epoch": 96.0,
|
14035 |
"eval_accuracy": 0.8303249097472925,
|
14036 |
"eval_loss": 0.427941232919693,
|
14037 |
+
"eval_runtime": 0.9388,
|
14038 |
+
"eval_samples_per_second": 295.043,
|
14039 |
+
"eval_steps_per_second": 37.28,
|
14040 |
"step": 18816
|
14041 |
},
|
14042 |
{
|
|
|
14183 |
"epoch": 97.0,
|
14184 |
"eval_accuracy": 0.8411552346570397,
|
14185 |
"eval_loss": 0.6587985157966614,
|
14186 |
+
"eval_runtime": 0.9391,
|
14187 |
+
"eval_samples_per_second": 294.975,
|
14188 |
+
"eval_steps_per_second": 37.271,
|
14189 |
"step": 19012
|
14190 |
},
|
14191 |
{
|
|
|
14325 |
"epoch": 98.0,
|
14326 |
"eval_accuracy": 0.8267148014440433,
|
14327 |
"eval_loss": 0.66323322057724,
|
14328 |
+
"eval_runtime": 0.9369,
|
14329 |
+
"eval_samples_per_second": 295.657,
|
14330 |
+
"eval_steps_per_second": 37.357,
|
14331 |
"step": 19208
|
14332 |
},
|
14333 |
{
|
|
|
14474 |
"epoch": 99.0,
|
14475 |
"eval_accuracy": 0.8808664259927798,
|
14476 |
"eval_loss": 0.4641692638397217,
|
14477 |
+
"eval_runtime": 0.9404,
|
14478 |
+
"eval_samples_per_second": 294.555,
|
14479 |
+
"eval_steps_per_second": 37.218,
|
14480 |
"step": 19404
|
14481 |
},
|
14482 |
{
|
|
|
14623 |
"epoch": 100.0,
|
14624 |
"eval_accuracy": 0.8808664259927798,
|
14625 |
"eval_loss": 0.3624129593372345,
|
14626 |
+
"eval_runtime": 1.0032,
|
14627 |
+
"eval_samples_per_second": 276.121,
|
14628 |
+
"eval_steps_per_second": 34.889,
|
14629 |
"step": 19600
|
14630 |
},
|
14631 |
{
|
|
|
14633 |
"step": 19600,
|
14634 |
"total_flos": 5.678990728814592e+17,
|
14635 |
"train_loss": 0.30055975163317455,
|
14636 |
+
"train_runtime": 949.6972,
|
14637 |
+
"train_samples_per_second": 164.895,
|
14638 |
+
"train_steps_per_second": 20.638
|
14639 |
}
|
14640 |
],
|
14641 |
"logging_steps": 10,
|