CristianR8 committed on
Commit
3dcd2a2
1 Parent(s): ca27277

End of training

Browse files
Files changed (5) hide show
  1. README.md +5 -3
  2. all_results.json +6 -6
  3. eval_results.json +3 -3
  4. train_results.json +3 -3
  5. trainer_state.json +304 -304
README.md CHANGED
@@ -3,6 +3,8 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/efficientnet-b0
5
  tags:
 
 
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
@@ -16,10 +18,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # efficientnet-b0-cocoa
18
 
19
- This model is a fine-tuned version of [google/efficientnet-b0](https://huggingface.co/google/efficientnet-b0) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.3624
22
- - Accuracy: 0.8809
23
 
24
  ## Model description
25
 
 
3
  license: apache-2.0
4
  base_model: google/efficientnet-b0
5
  tags:
6
+ - image-classification
7
+ - vision
8
  - generated_from_trainer
9
  metrics:
10
  - accuracy
 
18
 
19
  # efficientnet-b0-cocoa
20
 
21
+ This model is a fine-tuned version of [google/efficientnet-b0](https://huggingface.co/google/efficientnet-b0) on the SemilleroCV/Cocoa-dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.2657
24
+ - Accuracy: 0.9097
25
 
26
  ## Model description
27
 
all_results.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch": 100.0,
3
  "eval_accuracy": 0.9097472924187726,
4
  "eval_loss": 0.26566287875175476,
5
- "eval_runtime": 0.9695,
6
- "eval_samples_per_second": 285.718,
7
- "eval_steps_per_second": 36.102,
8
  "total_flos": 5.678990728814592e+17,
9
  "train_loss": 0.30055975163317455,
10
- "train_runtime": 936.3063,
11
- "train_samples_per_second": 167.253,
12
- "train_steps_per_second": 20.933
13
  }
 
2
  "epoch": 100.0,
3
  "eval_accuracy": 0.9097472924187726,
4
  "eval_loss": 0.26566287875175476,
5
+ "eval_runtime": 0.9793,
6
+ "eval_samples_per_second": 282.857,
7
+ "eval_steps_per_second": 35.74,
8
  "total_flos": 5.678990728814592e+17,
9
  "train_loss": 0.30055975163317455,
10
+ "train_runtime": 949.6972,
11
+ "train_samples_per_second": 164.895,
12
+ "train_steps_per_second": 20.638
13
  }
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 100.0,
3
  "eval_accuracy": 0.9097472924187726,
4
  "eval_loss": 0.26566287875175476,
5
- "eval_runtime": 0.9695,
6
- "eval_samples_per_second": 285.718,
7
- "eval_steps_per_second": 36.102
8
  }
 
2
  "epoch": 100.0,
3
  "eval_accuracy": 0.9097472924187726,
4
  "eval_loss": 0.26566287875175476,
5
+ "eval_runtime": 0.9793,
6
+ "eval_samples_per_second": 282.857,
7
+ "eval_steps_per_second": 35.74
8
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 100.0,
3
  "total_flos": 5.678990728814592e+17,
4
  "train_loss": 0.30055975163317455,
5
- "train_runtime": 936.3063,
6
- "train_samples_per_second": 167.253,
7
- "train_steps_per_second": 20.933
8
  }
 
2
  "epoch": 100.0,
3
  "total_flos": 5.678990728814592e+17,
4
  "train_loss": 0.30055975163317455,
5
+ "train_runtime": 949.6972,
6
+ "train_samples_per_second": 164.895,
7
+ "train_steps_per_second": 20.638
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_metric": 0.26566287875175476,
3
- "best_model_checkpoint": "./cocoa_outputs_efficientnet/checkpoint-6468",
4
  "epoch": 100.0,
5
  "eval_steps": 500,
6
  "global_step": 19600,
@@ -145,9 +145,9 @@
145
  "epoch": 1.0,
146
  "eval_accuracy": 0.5595667870036101,
147
  "eval_loss": 1.5222723484039307,
148
- "eval_runtime": 0.9623,
149
- "eval_samples_per_second": 287.86,
150
- "eval_steps_per_second": 36.372,
151
  "step": 196
152
  },
153
  {
@@ -294,9 +294,9 @@
294
  "epoch": 2.0,
295
  "eval_accuracy": 0.8303249097472925,
296
  "eval_loss": 0.8974758386611938,
297
- "eval_runtime": 0.9254,
298
- "eval_samples_per_second": 299.328,
299
- "eval_steps_per_second": 37.821,
300
  "step": 392
301
  },
302
  {
@@ -436,9 +436,9 @@
436
  "epoch": 3.0,
437
  "eval_accuracy": 0.8772563176895307,
438
  "eval_loss": 0.6563544273376465,
439
- "eval_runtime": 0.9258,
440
- "eval_samples_per_second": 299.212,
441
- "eval_steps_per_second": 37.807,
442
  "step": 588
443
  },
444
  {
@@ -585,9 +585,9 @@
585
  "epoch": 4.0,
586
  "eval_accuracy": 0.8339350180505415,
587
  "eval_loss": 0.6841569542884827,
588
- "eval_runtime": 0.9246,
589
- "eval_samples_per_second": 299.576,
590
- "eval_steps_per_second": 37.853,
591
  "step": 784
592
  },
593
  {
@@ -734,9 +734,9 @@
734
  "epoch": 5.0,
735
  "eval_accuracy": 0.8808664259927798,
736
  "eval_loss": 0.48941850662231445,
737
- "eval_runtime": 0.9211,
738
- "eval_samples_per_second": 300.733,
739
- "eval_steps_per_second": 37.999,
740
  "step": 980
741
  },
742
  {
@@ -876,9 +876,9 @@
876
  "epoch": 6.0,
877
  "eval_accuracy": 0.8736462093862816,
878
  "eval_loss": 0.41603580117225647,
879
- "eval_runtime": 0.9268,
880
- "eval_samples_per_second": 298.89,
881
- "eval_steps_per_second": 37.766,
882
  "step": 1176
883
  },
884
  {
@@ -1025,9 +1025,9 @@
1025
  "epoch": 7.0,
1026
  "eval_accuracy": 0.8844765342960289,
1027
  "eval_loss": 0.40221381187438965,
1028
- "eval_runtime": 0.9961,
1029
- "eval_samples_per_second": 278.09,
1030
- "eval_steps_per_second": 35.138,
1031
  "step": 1372
1032
  },
1033
  {
@@ -1167,9 +1167,9 @@
1167
  "epoch": 8.0,
1168
  "eval_accuracy": 0.8411552346570397,
1169
  "eval_loss": 0.4939042627811432,
1170
- "eval_runtime": 0.9269,
1171
- "eval_samples_per_second": 298.835,
1172
- "eval_steps_per_second": 37.759,
1173
  "step": 1568
1174
  },
1175
  {
@@ -1316,9 +1316,9 @@
1316
  "epoch": 9.0,
1317
  "eval_accuracy": 0.8772563176895307,
1318
  "eval_loss": 0.35403916239738464,
1319
- "eval_runtime": 0.9961,
1320
- "eval_samples_per_second": 278.089,
1321
- "eval_steps_per_second": 35.138,
1322
  "step": 1764
1323
  },
1324
  {
@@ -1465,9 +1465,9 @@
1465
  "epoch": 10.0,
1466
  "eval_accuracy": 0.8953068592057761,
1467
  "eval_loss": 0.349290668964386,
1468
- "eval_runtime": 0.9261,
1469
- "eval_samples_per_second": 299.092,
1470
- "eval_steps_per_second": 37.791,
1471
  "step": 1960
1472
  },
1473
  {
@@ -1607,9 +1607,9 @@
1607
  "epoch": 11.0,
1608
  "eval_accuracy": 0.776173285198556,
1609
  "eval_loss": 0.7928438186645508,
1610
- "eval_runtime": 0.9258,
1611
- "eval_samples_per_second": 299.201,
1612
- "eval_steps_per_second": 37.805,
1613
  "step": 2156
1614
  },
1615
  {
@@ -1756,9 +1756,9 @@
1756
  "epoch": 12.0,
1757
  "eval_accuracy": 0.296028880866426,
1758
  "eval_loss": 2.06593918800354,
1759
- "eval_runtime": 0.9316,
1760
- "eval_samples_per_second": 297.347,
1761
- "eval_steps_per_second": 37.571,
1762
  "step": 2352
1763
  },
1764
  {
@@ -1898,9 +1898,9 @@
1898
  "epoch": 13.0,
1899
  "eval_accuracy": 0.851985559566787,
1900
  "eval_loss": 0.44439464807510376,
1901
- "eval_runtime": 0.9238,
1902
- "eval_samples_per_second": 299.863,
1903
- "eval_steps_per_second": 37.889,
1904
  "step": 2548
1905
  },
1906
  {
@@ -2047,9 +2047,9 @@
2047
  "epoch": 14.0,
2048
  "eval_accuracy": 0.8736462093862816,
2049
  "eval_loss": 0.46400919556617737,
2050
- "eval_runtime": 0.9277,
2051
- "eval_samples_per_second": 298.595,
2052
- "eval_steps_per_second": 37.729,
2053
  "step": 2744
2054
  },
2055
  {
@@ -2196,9 +2196,9 @@
2196
  "epoch": 15.0,
2197
  "eval_accuracy": 0.8772563176895307,
2198
  "eval_loss": 0.37753719091415405,
2199
- "eval_runtime": 0.9263,
2200
- "eval_samples_per_second": 299.04,
2201
- "eval_steps_per_second": 37.785,
2202
  "step": 2940
2203
  },
2204
  {
@@ -2338,9 +2338,9 @@
2338
  "epoch": 16.0,
2339
  "eval_accuracy": 0.8880866425992779,
2340
  "eval_loss": 0.3519056737422943,
2341
- "eval_runtime": 0.9249,
2342
- "eval_samples_per_second": 299.483,
2343
- "eval_steps_per_second": 37.841,
2344
  "step": 3136
2345
  },
2346
  {
@@ -2487,9 +2487,9 @@
2487
  "epoch": 17.0,
2488
  "eval_accuracy": 0.9061371841155235,
2489
  "eval_loss": 0.33103030920028687,
2490
- "eval_runtime": 0.9321,
2491
- "eval_samples_per_second": 297.184,
2492
- "eval_steps_per_second": 37.55,
2493
  "step": 3332
2494
  },
2495
  {
@@ -2629,9 +2629,9 @@
2629
  "epoch": 18.0,
2630
  "eval_accuracy": 0.8916967509025271,
2631
  "eval_loss": 0.34751203656196594,
2632
- "eval_runtime": 0.9902,
2633
- "eval_samples_per_second": 279.742,
2634
- "eval_steps_per_second": 35.346,
2635
  "step": 3528
2636
  },
2637
  {
@@ -2778,9 +2778,9 @@
2778
  "epoch": 19.0,
2779
  "eval_accuracy": 0.8592057761732852,
2780
  "eval_loss": 0.38391339778900146,
2781
- "eval_runtime": 0.9252,
2782
- "eval_samples_per_second": 299.384,
2783
- "eval_steps_per_second": 37.828,
2784
  "step": 3724
2785
  },
2786
  {
@@ -2927,9 +2927,9 @@
2927
  "epoch": 20.0,
2928
  "eval_accuracy": 0.9133574007220217,
2929
  "eval_loss": 0.3031846880912781,
2930
- "eval_runtime": 0.9294,
2931
- "eval_samples_per_second": 298.047,
2932
- "eval_steps_per_second": 37.659,
2933
  "step": 3920
2934
  },
2935
  {
@@ -3069,9 +3069,9 @@
3069
  "epoch": 21.0,
3070
  "eval_accuracy": 0.851985559566787,
3071
  "eval_loss": 0.4246116876602173,
3072
- "eval_runtime": 0.9793,
3073
- "eval_samples_per_second": 282.866,
3074
- "eval_steps_per_second": 35.741,
3075
  "step": 4116
3076
  },
3077
  {
@@ -3218,9 +3218,9 @@
3218
  "epoch": 22.0,
3219
  "eval_accuracy": 0.8989169675090253,
3220
  "eval_loss": 0.29509276151657104,
3221
- "eval_runtime": 0.9468,
3222
- "eval_samples_per_second": 292.564,
3223
- "eval_steps_per_second": 36.967,
3224
  "step": 4312
3225
  },
3226
  {
@@ -3360,9 +3360,9 @@
3360
  "epoch": 23.0,
3361
  "eval_accuracy": 0.851985559566787,
3362
  "eval_loss": 0.4356595277786255,
3363
- "eval_runtime": 0.9291,
3364
- "eval_samples_per_second": 298.141,
3365
- "eval_steps_per_second": 37.671,
3366
  "step": 4508
3367
  },
3368
  {
@@ -3509,9 +3509,9 @@
3509
  "epoch": 24.0,
3510
  "eval_accuracy": 0.8916967509025271,
3511
  "eval_loss": 0.399036169052124,
3512
- "eval_runtime": 0.9832,
3513
- "eval_samples_per_second": 281.719,
3514
- "eval_steps_per_second": 35.596,
3515
  "step": 4704
3516
  },
3517
  {
@@ -3658,9 +3658,9 @@
3658
  "epoch": 25.0,
3659
  "eval_accuracy": 0.9097472924187726,
3660
  "eval_loss": 0.35359257459640503,
3661
- "eval_runtime": 0.9278,
3662
- "eval_samples_per_second": 298.55,
3663
- "eval_steps_per_second": 37.723,
3664
  "step": 4900
3665
  },
3666
  {
@@ -3800,9 +3800,9 @@
3800
  "epoch": 26.0,
3801
  "eval_accuracy": 0.8592057761732852,
3802
  "eval_loss": 0.4166140854358673,
3803
- "eval_runtime": 0.9508,
3804
- "eval_samples_per_second": 291.327,
3805
- "eval_steps_per_second": 36.81,
3806
  "step": 5096
3807
  },
3808
  {
@@ -3949,9 +3949,9 @@
3949
  "epoch": 27.0,
3950
  "eval_accuracy": 0.851985559566787,
3951
  "eval_loss": 0.4353993237018585,
3952
- "eval_runtime": 0.9437,
3953
- "eval_samples_per_second": 293.541,
3954
- "eval_steps_per_second": 37.09,
3955
  "step": 5292
3956
  },
3957
  {
@@ -4091,9 +4091,9 @@
4091
  "epoch": 28.0,
4092
  "eval_accuracy": 0.8592057761732852,
4093
  "eval_loss": 0.4088672697544098,
4094
- "eval_runtime": 0.9296,
4095
- "eval_samples_per_second": 297.977,
4096
- "eval_steps_per_second": 37.651,
4097
  "step": 5488
4098
  },
4099
  {
@@ -4240,9 +4240,9 @@
4240
  "epoch": 29.0,
4241
  "eval_accuracy": 0.8231046931407943,
4242
  "eval_loss": 0.4787161946296692,
4243
- "eval_runtime": 0.9706,
4244
- "eval_samples_per_second": 285.392,
4245
- "eval_steps_per_second": 36.06,
4246
  "step": 5684
4247
  },
4248
  {
@@ -4389,9 +4389,9 @@
4389
  "epoch": 30.0,
4390
  "eval_accuracy": 0.9097472924187726,
4391
  "eval_loss": 0.3165305256843567,
4392
- "eval_runtime": 0.9312,
4393
- "eval_samples_per_second": 297.455,
4394
- "eval_steps_per_second": 37.585,
4395
  "step": 5880
4396
  },
4397
  {
@@ -4531,9 +4531,9 @@
4531
  "epoch": 31.0,
4532
  "eval_accuracy": 0.9133574007220217,
4533
  "eval_loss": 0.31053850054740906,
4534
- "eval_runtime": 0.9255,
4535
- "eval_samples_per_second": 299.294,
4536
- "eval_steps_per_second": 37.817,
4537
  "step": 6076
4538
  },
4539
  {
@@ -4680,9 +4680,9 @@
4680
  "epoch": 32.0,
4681
  "eval_accuracy": 0.9061371841155235,
4682
  "eval_loss": 0.3559906780719757,
4683
- "eval_runtime": 0.9627,
4684
- "eval_samples_per_second": 287.745,
4685
- "eval_steps_per_second": 36.358,
4686
  "step": 6272
4687
  },
4688
  {
@@ -4822,9 +4822,9 @@
4822
  "epoch": 33.0,
4823
  "eval_accuracy": 0.9097472924187726,
4824
  "eval_loss": 0.26566287875175476,
4825
- "eval_runtime": 0.928,
4826
- "eval_samples_per_second": 298.475,
4827
- "eval_steps_per_second": 37.714,
4828
  "step": 6468
4829
  },
4830
  {
@@ -4971,9 +4971,9 @@
4971
  "epoch": 34.0,
4972
  "eval_accuracy": 0.9133574007220217,
4973
  "eval_loss": 0.2679595947265625,
4974
- "eval_runtime": 0.9366,
4975
- "eval_samples_per_second": 295.757,
4976
- "eval_steps_per_second": 37.37,
4977
  "step": 6664
4978
  },
4979
  {
@@ -5120,9 +5120,9 @@
5120
  "epoch": 35.0,
5121
  "eval_accuracy": 0.9061371841155235,
5122
  "eval_loss": 0.3797638416290283,
5123
- "eval_runtime": 0.9257,
5124
- "eval_samples_per_second": 299.246,
5125
- "eval_steps_per_second": 37.811,
5126
  "step": 6860
5127
  },
5128
  {
@@ -5262,9 +5262,9 @@
5262
  "epoch": 36.0,
5263
  "eval_accuracy": 0.855595667870036,
5264
  "eval_loss": 0.5098311305046082,
5265
- "eval_runtime": 0.9275,
5266
- "eval_samples_per_second": 298.64,
5267
- "eval_steps_per_second": 37.734,
5268
  "step": 7056
5269
  },
5270
  {
@@ -5411,9 +5411,9 @@
5411
  "epoch": 37.0,
5412
  "eval_accuracy": 0.8808664259927798,
5413
  "eval_loss": 0.42190420627593994,
5414
- "eval_runtime": 0.9289,
5415
- "eval_samples_per_second": 298.203,
5416
- "eval_steps_per_second": 37.679,
5417
  "step": 7252
5418
  },
5419
  {
@@ -5553,9 +5553,9 @@
5553
  "epoch": 38.0,
5554
  "eval_accuracy": 0.9133574007220217,
5555
  "eval_loss": 0.2851579189300537,
5556
- "eval_runtime": 0.9232,
5557
- "eval_samples_per_second": 300.035,
5558
- "eval_steps_per_second": 37.911,
5559
  "step": 7448
5560
  },
5561
  {
@@ -5702,9 +5702,9 @@
5702
  "epoch": 39.0,
5703
  "eval_accuracy": 0.8989169675090253,
5704
  "eval_loss": 0.36030298471450806,
5705
- "eval_runtime": 0.9253,
5706
- "eval_samples_per_second": 299.352,
5707
- "eval_steps_per_second": 37.824,
5708
  "step": 7644
5709
  },
5710
  {
@@ -5851,9 +5851,9 @@
5851
  "epoch": 40.0,
5852
  "eval_accuracy": 0.8736462093862816,
5853
  "eval_loss": 0.351894736289978,
5854
- "eval_runtime": 0.9281,
5855
- "eval_samples_per_second": 298.457,
5856
- "eval_steps_per_second": 37.711,
5857
  "step": 7840
5858
  },
5859
  {
@@ -5993,9 +5993,9 @@
5993
  "epoch": 41.0,
5994
  "eval_accuracy": 0.9025270758122743,
5995
  "eval_loss": 0.3343473970890045,
5996
- "eval_runtime": 0.928,
5997
- "eval_samples_per_second": 298.486,
5998
- "eval_steps_per_second": 37.715,
5999
  "step": 8036
6000
  },
6001
  {
@@ -6142,9 +6142,9 @@
6142
  "epoch": 42.0,
6143
  "eval_accuracy": 0.9169675090252708,
6144
  "eval_loss": 0.3383941352367401,
6145
- "eval_runtime": 0.9259,
6146
- "eval_samples_per_second": 299.182,
6147
- "eval_steps_per_second": 37.803,
6148
  "step": 8232
6149
  },
6150
  {
@@ -6284,9 +6284,9 @@
6284
  "epoch": 43.0,
6285
  "eval_accuracy": 0.8772563176895307,
6286
  "eval_loss": 0.40458711981773376,
6287
- "eval_runtime": 0.9234,
6288
- "eval_samples_per_second": 299.99,
6289
- "eval_steps_per_second": 37.905,
6290
  "step": 8428
6291
  },
6292
  {
@@ -6433,9 +6433,9 @@
6433
  "epoch": 44.0,
6434
  "eval_accuracy": 0.8916967509025271,
6435
  "eval_loss": 0.39525121450424194,
6436
- "eval_runtime": 0.9242,
6437
- "eval_samples_per_second": 299.71,
6438
- "eval_steps_per_second": 37.87,
6439
  "step": 8624
6440
  },
6441
  {
@@ -6582,9 +6582,9 @@
6582
  "epoch": 45.0,
6583
  "eval_accuracy": 0.8592057761732852,
6584
  "eval_loss": 0.5002943873405457,
6585
- "eval_runtime": 0.9317,
6586
- "eval_samples_per_second": 297.301,
6587
- "eval_steps_per_second": 37.565,
6588
  "step": 8820
6589
  },
6590
  {
@@ -6724,9 +6724,9 @@
6724
  "epoch": 46.0,
6725
  "eval_accuracy": 0.9169675090252708,
6726
  "eval_loss": 0.3231888711452484,
6727
- "eval_runtime": 0.925,
6728
- "eval_samples_per_second": 299.445,
6729
- "eval_steps_per_second": 37.836,
6730
  "step": 9016
6731
  },
6732
  {
@@ -6873,9 +6873,9 @@
6873
  "epoch": 47.0,
6874
  "eval_accuracy": 0.9169675090252708,
6875
  "eval_loss": 0.3112559914588928,
6876
- "eval_runtime": 0.9224,
6877
- "eval_samples_per_second": 300.307,
6878
- "eval_steps_per_second": 37.945,
6879
  "step": 9212
6880
  },
6881
  {
@@ -7015,9 +7015,9 @@
7015
  "epoch": 48.0,
7016
  "eval_accuracy": 0.855595667870036,
7017
  "eval_loss": 0.4494384229183197,
7018
- "eval_runtime": 0.9397,
7019
- "eval_samples_per_second": 294.784,
7020
- "eval_steps_per_second": 37.247,
7021
  "step": 9408
7022
  },
7023
  {
@@ -7164,9 +7164,9 @@
7164
  "epoch": 49.0,
7165
  "eval_accuracy": 0.9205776173285198,
7166
  "eval_loss": 0.37217509746551514,
7167
- "eval_runtime": 0.9345,
7168
- "eval_samples_per_second": 296.412,
7169
- "eval_steps_per_second": 37.453,
7170
  "step": 9604
7171
  },
7172
  {
@@ -7313,9 +7313,9 @@
7313
  "epoch": 50.0,
7314
  "eval_accuracy": 0.9097472924187726,
7315
  "eval_loss": 0.2852139472961426,
7316
- "eval_runtime": 0.9274,
7317
- "eval_samples_per_second": 298.696,
7318
- "eval_steps_per_second": 37.741,
7319
  "step": 9800
7320
  },
7321
  {
@@ -7455,9 +7455,9 @@
7455
  "epoch": 51.0,
7456
  "eval_accuracy": 0.8628158844765343,
7457
  "eval_loss": 0.4137951135635376,
7458
- "eval_runtime": 0.9394,
7459
- "eval_samples_per_second": 294.867,
7460
- "eval_steps_per_second": 37.258,
7461
  "step": 9996
7462
  },
7463
  {
@@ -7604,9 +7604,9 @@
7604
  "epoch": 52.0,
7605
  "eval_accuracy": 0.8953068592057761,
7606
  "eval_loss": 0.34130236506462097,
7607
- "eval_runtime": 0.95,
7608
- "eval_samples_per_second": 291.574,
7609
- "eval_steps_per_second": 36.841,
7610
  "step": 10192
7611
  },
7612
  {
@@ -7746,9 +7746,9 @@
7746
  "epoch": 53.0,
7747
  "eval_accuracy": 0.9169675090252708,
7748
  "eval_loss": 0.30462250113487244,
7749
- "eval_runtime": 0.9555,
7750
- "eval_samples_per_second": 289.887,
7751
- "eval_steps_per_second": 36.628,
7752
  "step": 10388
7753
  },
7754
  {
@@ -7895,9 +7895,9 @@
7895
  "epoch": 54.0,
7896
  "eval_accuracy": 0.8989169675090253,
7897
  "eval_loss": 0.2849152684211731,
7898
- "eval_runtime": 0.9234,
7899
- "eval_samples_per_second": 299.993,
7900
- "eval_steps_per_second": 37.905,
7901
  "step": 10584
7902
  },
7903
  {
@@ -8044,9 +8044,9 @@
8044
  "epoch": 55.0,
8045
  "eval_accuracy": 0.9133574007220217,
8046
  "eval_loss": 0.35168057680130005,
8047
- "eval_runtime": 0.9261,
8048
- "eval_samples_per_second": 299.089,
8049
- "eval_steps_per_second": 37.791,
8050
  "step": 10780
8051
  },
8052
  {
@@ -8186,9 +8186,9 @@
8186
  "epoch": 56.0,
8187
  "eval_accuracy": 0.9025270758122743,
8188
  "eval_loss": 0.45381447672843933,
8189
- "eval_runtime": 0.9559,
8190
- "eval_samples_per_second": 289.776,
8191
- "eval_steps_per_second": 36.614,
8192
  "step": 10976
8193
  },
8194
  {
@@ -8335,9 +8335,9 @@
8335
  "epoch": 57.0,
8336
  "eval_accuracy": 0.8592057761732852,
8337
  "eval_loss": 0.44916799664497375,
8338
- "eval_runtime": 0.9386,
8339
- "eval_samples_per_second": 295.131,
8340
- "eval_steps_per_second": 37.291,
8341
  "step": 11172
8342
  },
8343
  {
@@ -8477,9 +8477,9 @@
8477
  "epoch": 58.0,
8478
  "eval_accuracy": 0.8628158844765343,
8479
  "eval_loss": 0.4738902747631073,
8480
- "eval_runtime": 0.9256,
8481
- "eval_samples_per_second": 299.274,
8482
- "eval_steps_per_second": 37.814,
8483
  "step": 11368
8484
  },
8485
  {
@@ -8626,9 +8626,9 @@
8626
  "epoch": 59.0,
8627
  "eval_accuracy": 0.9205776173285198,
8628
  "eval_loss": 0.2831103205680847,
8629
- "eval_runtime": 0.9267,
8630
- "eval_samples_per_second": 298.914,
8631
- "eval_steps_per_second": 37.769,
8632
  "step": 11564
8633
  },
8634
  {
@@ -8775,9 +8775,9 @@
8775
  "epoch": 60.0,
8776
  "eval_accuracy": 0.9205776173285198,
8777
  "eval_loss": 0.34654152393341064,
8778
- "eval_runtime": 0.924,
8779
- "eval_samples_per_second": 299.794,
8780
- "eval_steps_per_second": 37.88,
8781
  "step": 11760
8782
  },
8783
  {
@@ -8917,9 +8917,9 @@
8917
  "epoch": 61.0,
8918
  "eval_accuracy": 0.9314079422382672,
8919
  "eval_loss": 0.28843551874160767,
8920
- "eval_runtime": 0.9387,
8921
- "eval_samples_per_second": 295.083,
8922
- "eval_steps_per_second": 37.285,
8923
  "step": 11956
8924
  },
8925
  {
@@ -9066,9 +9066,9 @@
9066
  "epoch": 62.0,
9067
  "eval_accuracy": 0.8447653429602888,
9068
  "eval_loss": 0.4874745309352875,
9069
- "eval_runtime": 0.9245,
9070
- "eval_samples_per_second": 299.628,
9071
- "eval_steps_per_second": 37.859,
9072
  "step": 12152
9073
  },
9074
  {
@@ -9208,9 +9208,9 @@
9208
  "epoch": 63.0,
9209
  "eval_accuracy": 0.9061371841155235,
9210
  "eval_loss": 0.3988655209541321,
9211
- "eval_runtime": 0.9265,
9212
- "eval_samples_per_second": 298.961,
9213
- "eval_steps_per_second": 37.775,
9214
  "step": 12348
9215
  },
9216
  {
@@ -9357,9 +9357,9 @@
9357
  "epoch": 64.0,
9358
  "eval_accuracy": 0.851985559566787,
9359
  "eval_loss": 0.5952923893928528,
9360
- "eval_runtime": 0.9245,
9361
- "eval_samples_per_second": 299.616,
9362
- "eval_steps_per_second": 37.858,
9363
  "step": 12544
9364
  },
9365
  {
@@ -9506,9 +9506,9 @@
9506
  "epoch": 65.0,
9507
  "eval_accuracy": 0.927797833935018,
9508
  "eval_loss": 0.2953914701938629,
9509
- "eval_runtime": 0.921,
9510
- "eval_samples_per_second": 300.758,
9511
- "eval_steps_per_second": 38.002,
9512
  "step": 12740
9513
  },
9514
  {
@@ -9648,9 +9648,9 @@
9648
  "epoch": 66.0,
9649
  "eval_accuracy": 0.851985559566787,
9650
  "eval_loss": 0.5033073425292969,
9651
- "eval_runtime": 0.9234,
9652
- "eval_samples_per_second": 299.974,
9653
- "eval_steps_per_second": 37.903,
9654
  "step": 12936
9655
  },
9656
  {
@@ -9797,9 +9797,9 @@
9797
  "epoch": 67.0,
9798
  "eval_accuracy": 0.8808664259927798,
9799
  "eval_loss": 0.41321179270744324,
9800
- "eval_runtime": 0.9749,
9801
- "eval_samples_per_second": 284.139,
9802
- "eval_steps_per_second": 35.902,
9803
  "step": 13132
9804
  },
9805
  {
@@ -9939,9 +9939,9 @@
9939
  "epoch": 68.0,
9940
  "eval_accuracy": 0.9169675090252708,
9941
  "eval_loss": 0.37430626153945923,
9942
- "eval_runtime": 0.927,
9943
- "eval_samples_per_second": 298.802,
9944
- "eval_steps_per_second": 37.755,
9945
  "step": 13328
9946
  },
9947
  {
@@ -10088,9 +10088,9 @@
10088
  "epoch": 69.0,
10089
  "eval_accuracy": 0.776173285198556,
10090
  "eval_loss": 0.6423271298408508,
10091
- "eval_runtime": 0.9196,
10092
- "eval_samples_per_second": 301.217,
10093
- "eval_steps_per_second": 38.06,
10094
  "step": 13524
10095
  },
10096
  {
@@ -10237,9 +10237,9 @@
10237
  "epoch": 70.0,
10238
  "eval_accuracy": 0.8014440433212996,
10239
  "eval_loss": 0.5979345440864563,
10240
- "eval_runtime": 0.9248,
10241
- "eval_samples_per_second": 299.519,
10242
- "eval_steps_per_second": 37.845,
10243
  "step": 13720
10244
  },
10245
  {
@@ -10379,9 +10379,9 @@
10379
  "epoch": 71.0,
10380
  "eval_accuracy": 0.8989169675090253,
10381
  "eval_loss": 0.43981537222862244,
10382
- "eval_runtime": 0.9267,
10383
- "eval_samples_per_second": 298.919,
10384
- "eval_steps_per_second": 37.77,
10385
  "step": 13916
10386
  },
10387
  {
@@ -10528,9 +10528,9 @@
10528
  "epoch": 72.0,
10529
  "eval_accuracy": 0.8231046931407943,
10530
  "eval_loss": 0.5633912086486816,
10531
- "eval_runtime": 0.9302,
10532
- "eval_samples_per_second": 297.785,
10533
- "eval_steps_per_second": 37.626,
10534
  "step": 14112
10535
  },
10536
  {
@@ -10670,9 +10670,9 @@
10670
  "epoch": 73.0,
10671
  "eval_accuracy": 0.776173285198556,
10672
  "eval_loss": 0.620398223400116,
10673
- "eval_runtime": 0.9237,
10674
- "eval_samples_per_second": 299.897,
10675
- "eval_steps_per_second": 37.893,
10676
  "step": 14308
10677
  },
10678
  {
@@ -10819,9 +10819,9 @@
10819
  "epoch": 74.0,
10820
  "eval_accuracy": 0.8953068592057761,
10821
  "eval_loss": 0.36853671073913574,
10822
- "eval_runtime": 0.9295,
10823
- "eval_samples_per_second": 298.006,
10824
- "eval_steps_per_second": 37.654,
10825
  "step": 14504
10826
  },
10827
  {
@@ -10968,9 +10968,9 @@
10968
  "epoch": 75.0,
10969
  "eval_accuracy": 0.8158844765342961,
10970
  "eval_loss": 0.7026161551475525,
10971
- "eval_runtime": 0.9261,
10972
- "eval_samples_per_second": 299.112,
10973
- "eval_steps_per_second": 37.794,
10974
  "step": 14700
10975
  },
10976
  {
@@ -11110,9 +11110,9 @@
11110
  "epoch": 76.0,
11111
  "eval_accuracy": 0.9169675090252708,
11112
  "eval_loss": 0.40481600165367126,
11113
- "eval_runtime": 0.9284,
11114
- "eval_samples_per_second": 298.348,
11115
- "eval_steps_per_second": 37.697,
11116
  "step": 14896
11117
  },
11118
  {
@@ -11259,9 +11259,9 @@
11259
  "epoch": 77.0,
11260
  "eval_accuracy": 0.8844765342960289,
11261
  "eval_loss": 0.48912858963012695,
11262
- "eval_runtime": 0.9337,
11263
- "eval_samples_per_second": 296.677,
11264
- "eval_steps_per_second": 37.486,
11265
  "step": 15092
11266
  },
11267
  {
@@ -11401,9 +11401,9 @@
11401
  "epoch": 78.0,
11402
  "eval_accuracy": 0.8772563176895307,
11403
  "eval_loss": 0.42159637808799744,
11404
- "eval_runtime": 0.9262,
11405
- "eval_samples_per_second": 299.086,
11406
- "eval_steps_per_second": 37.791,
11407
  "step": 15288
11408
  },
11409
  {
@@ -11550,9 +11550,9 @@
11550
  "epoch": 79.0,
11551
  "eval_accuracy": 0.8953068592057761,
11552
  "eval_loss": 0.2720978558063507,
11553
- "eval_runtime": 0.9227,
11554
- "eval_samples_per_second": 300.203,
11555
- "eval_steps_per_second": 37.932,
11556
  "step": 15484
11557
  },
11558
  {
@@ -11699,9 +11699,9 @@
11699
  "epoch": 80.0,
11700
  "eval_accuracy": 0.8483754512635379,
11701
  "eval_loss": 0.42701977491378784,
11702
- "eval_runtime": 0.9196,
11703
- "eval_samples_per_second": 301.231,
11704
- "eval_steps_per_second": 38.062,
11705
  "step": 15680
11706
  },
11707
  {
@@ -11841,9 +11841,9 @@
11841
  "epoch": 81.0,
11842
  "eval_accuracy": 0.7833935018050542,
11843
  "eval_loss": 0.763225793838501,
11844
- "eval_runtime": 0.9257,
11845
- "eval_samples_per_second": 299.248,
11846
- "eval_steps_per_second": 37.811,
11847
  "step": 15876
11848
  },
11849
  {
@@ -11990,9 +11990,9 @@
11990
  "epoch": 82.0,
11991
  "eval_accuracy": 0.9025270758122743,
11992
  "eval_loss": 0.3249270021915436,
11993
- "eval_runtime": 0.9713,
11994
- "eval_samples_per_second": 285.18,
11995
- "eval_steps_per_second": 36.034,
11996
  "step": 16072
11997
  },
11998
  {
@@ -12132,9 +12132,9 @@
12132
  "epoch": 83.0,
12133
  "eval_accuracy": 0.8989169675090253,
12134
  "eval_loss": 0.38384127616882324,
12135
- "eval_runtime": 0.9259,
12136
- "eval_samples_per_second": 299.169,
12137
- "eval_steps_per_second": 37.801,
12138
  "step": 16268
12139
  },
12140
  {
@@ -12281,9 +12281,9 @@
12281
  "epoch": 84.0,
12282
  "eval_accuracy": 0.9205776173285198,
12283
  "eval_loss": 0.3329784572124481,
12284
- "eval_runtime": 0.9245,
12285
- "eval_samples_per_second": 299.612,
12286
- "eval_steps_per_second": 37.857,
12287
  "step": 16464
12288
  },
12289
  {
@@ -12430,9 +12430,9 @@
12430
  "epoch": 85.0,
12431
  "eval_accuracy": 0.8700361010830325,
12432
  "eval_loss": 0.32456666231155396,
12433
- "eval_runtime": 0.929,
12434
- "eval_samples_per_second": 298.181,
12435
- "eval_steps_per_second": 37.676,
12436
  "step": 16660
12437
  },
12438
  {
@@ -12572,9 +12572,9 @@
12572
  "epoch": 86.0,
12573
  "eval_accuracy": 0.8736462093862816,
12574
  "eval_loss": 0.3710058927536011,
12575
- "eval_runtime": 0.9876,
12576
- "eval_samples_per_second": 280.471,
12577
- "eval_steps_per_second": 35.439,
12578
  "step": 16856
12579
  },
12580
  {
@@ -12721,9 +12721,9 @@
12721
  "epoch": 87.0,
12722
  "eval_accuracy": 0.9061371841155235,
12723
  "eval_loss": 0.33839184045791626,
12724
- "eval_runtime": 0.9267,
12725
- "eval_samples_per_second": 298.923,
12726
- "eval_steps_per_second": 37.77,
12727
  "step": 17052
12728
  },
12729
  {
@@ -12863,9 +12863,9 @@
12863
  "epoch": 88.0,
12864
  "eval_accuracy": 0.9097472924187726,
12865
  "eval_loss": 0.3703186511993408,
12866
- "eval_runtime": 0.9909,
12867
- "eval_samples_per_second": 279.556,
12868
- "eval_steps_per_second": 35.323,
12869
  "step": 17248
12870
  },
12871
  {
@@ -13012,9 +13012,9 @@
13012
  "epoch": 89.0,
13013
  "eval_accuracy": 0.8592057761732852,
13014
  "eval_loss": 0.5013492703437805,
13015
- "eval_runtime": 0.9203,
13016
- "eval_samples_per_second": 300.985,
13017
- "eval_steps_per_second": 38.031,
13018
  "step": 17444
13019
  },
13020
  {
@@ -13161,9 +13161,9 @@
13161
  "epoch": 90.0,
13162
  "eval_accuracy": 0.8989169675090253,
13163
  "eval_loss": 0.3456423580646515,
13164
- "eval_runtime": 1.0017,
13165
- "eval_samples_per_second": 276.522,
13166
- "eval_steps_per_second": 34.94,
13167
  "step": 17640
13168
  },
13169
  {
@@ -13303,9 +13303,9 @@
13303
  "epoch": 91.0,
13304
  "eval_accuracy": 0.8880866425992779,
13305
  "eval_loss": 0.3798539340496063,
13306
- "eval_runtime": 0.9203,
13307
- "eval_samples_per_second": 301.002,
13308
- "eval_steps_per_second": 38.033,
13309
  "step": 17836
13310
  },
13311
  {
@@ -13452,9 +13452,9 @@
13452
  "epoch": 92.0,
13453
  "eval_accuracy": 0.9061371841155235,
13454
  "eval_loss": 0.32391440868377686,
13455
- "eval_runtime": 0.9941,
13456
- "eval_samples_per_second": 278.638,
13457
- "eval_steps_per_second": 35.207,
13458
  "step": 18032
13459
  },
13460
  {
@@ -13594,9 +13594,9 @@
13594
  "epoch": 93.0,
13595
  "eval_accuracy": 0.8989169675090253,
13596
  "eval_loss": 0.4861180782318115,
13597
- "eval_runtime": 0.923,
13598
- "eval_samples_per_second": 300.096,
13599
- "eval_steps_per_second": 37.918,
13600
  "step": 18228
13601
  },
13602
  {
@@ -13743,9 +13743,9 @@
13743
  "epoch": 94.0,
13744
  "eval_accuracy": 0.8736462093862816,
13745
  "eval_loss": 0.4443919062614441,
13746
- "eval_runtime": 0.9312,
13747
- "eval_samples_per_second": 297.478,
13748
- "eval_steps_per_second": 37.587,
13749
  "step": 18424
13750
  },
13751
  {
@@ -13892,9 +13892,9 @@
13892
  "epoch": 95.0,
13893
  "eval_accuracy": 0.8844765342960289,
13894
  "eval_loss": 0.3712524473667145,
13895
- "eval_runtime": 0.9321,
13896
- "eval_samples_per_second": 297.175,
13897
- "eval_steps_per_second": 37.549,
13898
  "step": 18620
13899
  },
13900
  {
@@ -14034,9 +14034,9 @@
14034
  "epoch": 96.0,
14035
  "eval_accuracy": 0.8303249097472925,
14036
  "eval_loss": 0.427941232919693,
14037
- "eval_runtime": 1.0012,
14038
- "eval_samples_per_second": 276.68,
14039
- "eval_steps_per_second": 34.96,
14040
  "step": 18816
14041
  },
14042
  {
@@ -14183,9 +14183,9 @@
14183
  "epoch": 97.0,
14184
  "eval_accuracy": 0.8411552346570397,
14185
  "eval_loss": 0.6587985157966614,
14186
- "eval_runtime": 0.937,
14187
- "eval_samples_per_second": 295.619,
14188
- "eval_steps_per_second": 37.353,
14189
  "step": 19012
14190
  },
14191
  {
@@ -14325,9 +14325,9 @@
14325
  "epoch": 98.0,
14326
  "eval_accuracy": 0.8267148014440433,
14327
  "eval_loss": 0.66323322057724,
14328
- "eval_runtime": 0.928,
14329
- "eval_samples_per_second": 298.496,
14330
- "eval_steps_per_second": 37.716,
14331
  "step": 19208
14332
  },
14333
  {
@@ -14474,9 +14474,9 @@
14474
  "epoch": 99.0,
14475
  "eval_accuracy": 0.8808664259927798,
14476
  "eval_loss": 0.4641692638397217,
14477
- "eval_runtime": 0.9262,
14478
- "eval_samples_per_second": 299.067,
14479
- "eval_steps_per_second": 37.788,
14480
  "step": 19404
14481
  },
14482
  {
@@ -14623,9 +14623,9 @@
14623
  "epoch": 100.0,
14624
  "eval_accuracy": 0.8808664259927798,
14625
  "eval_loss": 0.3624129593372345,
14626
- "eval_runtime": 0.9461,
14627
- "eval_samples_per_second": 292.771,
14628
- "eval_steps_per_second": 36.993,
14629
  "step": 19600
14630
  },
14631
  {
@@ -14633,9 +14633,9 @@
14633
  "step": 19600,
14634
  "total_flos": 5.678990728814592e+17,
14635
  "train_loss": 0.30055975163317455,
14636
- "train_runtime": 936.3063,
14637
- "train_samples_per_second": 167.253,
14638
- "train_steps_per_second": 20.933
14639
  }
14640
  ],
14641
  "logging_steps": 10,
 
1
  {
2
  "best_metric": 0.26566287875175476,
3
+ "best_model_checkpoint": "./cocoa_outputs_resnet/checkpoint-6468",
4
  "epoch": 100.0,
5
  "eval_steps": 500,
6
  "global_step": 19600,
 
145
  "epoch": 1.0,
146
  "eval_accuracy": 0.5595667870036101,
147
  "eval_loss": 1.5222723484039307,
148
+ "eval_runtime": 0.9569,
149
+ "eval_samples_per_second": 289.486,
150
+ "eval_steps_per_second": 36.578,
151
  "step": 196
152
  },
153
  {
 
294
  "epoch": 2.0,
295
  "eval_accuracy": 0.8303249097472925,
296
  "eval_loss": 0.8974758386611938,
297
+ "eval_runtime": 0.934,
298
+ "eval_samples_per_second": 296.569,
299
+ "eval_steps_per_second": 37.473,
300
  "step": 392
301
  },
302
  {
 
436
  "epoch": 3.0,
437
  "eval_accuracy": 0.8772563176895307,
438
  "eval_loss": 0.6563544273376465,
439
+ "eval_runtime": 0.936,
440
+ "eval_samples_per_second": 295.927,
441
+ "eval_steps_per_second": 37.391,
442
  "step": 588
443
  },
444
  {
 
585
  "epoch": 4.0,
586
  "eval_accuracy": 0.8339350180505415,
587
  "eval_loss": 0.6841569542884827,
588
+ "eval_runtime": 0.9273,
589
+ "eval_samples_per_second": 298.728,
590
+ "eval_steps_per_second": 37.745,
591
  "step": 784
592
  },
593
  {
 
734
  "epoch": 5.0,
735
  "eval_accuracy": 0.8808664259927798,
736
  "eval_loss": 0.48941850662231445,
737
+ "eval_runtime": 0.935,
738
+ "eval_samples_per_second": 296.252,
739
+ "eval_steps_per_second": 37.433,
740
  "step": 980
741
  },
742
  {
 
876
  "epoch": 6.0,
877
  "eval_accuracy": 0.8736462093862816,
878
  "eval_loss": 0.41603580117225647,
879
+ "eval_runtime": 0.9296,
880
+ "eval_samples_per_second": 297.99,
881
+ "eval_steps_per_second": 37.652,
882
  "step": 1176
883
  },
884
  {
 
1025
  "epoch": 7.0,
1026
  "eval_accuracy": 0.8844765342960289,
1027
  "eval_loss": 0.40221381187438965,
1028
+ "eval_runtime": 0.9298,
1029
+ "eval_samples_per_second": 297.902,
1030
+ "eval_steps_per_second": 37.641,
1031
  "step": 1372
1032
  },
1033
  {
 
1167
  "epoch": 8.0,
1168
  "eval_accuracy": 0.8411552346570397,
1169
  "eval_loss": 0.4939042627811432,
1170
+ "eval_runtime": 0.9311,
1171
+ "eval_samples_per_second": 297.494,
1172
+ "eval_steps_per_second": 37.589,
1173
  "step": 1568
1174
  },
1175
  {
 
1316
  "epoch": 9.0,
1317
  "eval_accuracy": 0.8772563176895307,
1318
  "eval_loss": 0.35403916239738464,
1319
+ "eval_runtime": 0.9315,
1320
+ "eval_samples_per_second": 297.362,
1321
+ "eval_steps_per_second": 37.573,
1322
  "step": 1764
1323
  },
1324
  {
 
1465
  "epoch": 10.0,
1466
  "eval_accuracy": 0.8953068592057761,
1467
  "eval_loss": 0.349290668964386,
1468
+ "eval_runtime": 0.9365,
1469
+ "eval_samples_per_second": 295.793,
1470
+ "eval_steps_per_second": 37.375,
1471
  "step": 1960
1472
  },
1473
  {
 
1607
  "epoch": 11.0,
1608
  "eval_accuracy": 0.776173285198556,
1609
  "eval_loss": 0.7928438186645508,
1610
+ "eval_runtime": 0.9321,
1611
+ "eval_samples_per_second": 297.189,
1612
+ "eval_steps_per_second": 37.551,
1613
  "step": 2156
1614
  },
1615
  {
 
1756
  "epoch": 12.0,
1757
  "eval_accuracy": 0.296028880866426,
1758
  "eval_loss": 2.06593918800354,
1759
+ "eval_runtime": 0.9947,
1760
+ "eval_samples_per_second": 278.482,
1761
+ "eval_steps_per_second": 35.187,
1762
  "step": 2352
1763
  },
1764
  {
 
1898
  "epoch": 13.0,
1899
  "eval_accuracy": 0.851985559566787,
1900
  "eval_loss": 0.44439464807510376,
1901
+ "eval_runtime": 0.9289,
1902
+ "eval_samples_per_second": 298.212,
1903
+ "eval_steps_per_second": 37.68,
1904
  "step": 2548
1905
  },
1906
  {
 
2047
  "epoch": 14.0,
2048
  "eval_accuracy": 0.8736462093862816,
2049
  "eval_loss": 0.46400919556617737,
2050
+ "eval_runtime": 0.9937,
2051
+ "eval_samples_per_second": 278.754,
2052
+ "eval_steps_per_second": 35.222,
2053
  "step": 2744
2054
  },
2055
  {
 
2196
  "epoch": 15.0,
2197
  "eval_accuracy": 0.8772563176895307,
2198
  "eval_loss": 0.37753719091415405,
2199
+ "eval_runtime": 0.9317,
2200
+ "eval_samples_per_second": 297.316,
2201
+ "eval_steps_per_second": 37.567,
2202
  "step": 2940
2203
  },
2204
  {
 
2338
  "epoch": 16.0,
2339
  "eval_accuracy": 0.8880866425992779,
2340
  "eval_loss": 0.3519056737422943,
2341
+ "eval_runtime": 0.9334,
2342
+ "eval_samples_per_second": 296.766,
2343
+ "eval_steps_per_second": 37.498,
2344
  "step": 3136
2345
  },
2346
  {
 
2487
  "epoch": 17.0,
2488
  "eval_accuracy": 0.9061371841155235,
2489
  "eval_loss": 0.33103030920028687,
2490
+ "eval_runtime": 0.9376,
2491
+ "eval_samples_per_second": 295.446,
2492
+ "eval_steps_per_second": 37.331,
2493
  "step": 3332
2494
  },
2495
  {
 
2629
  "epoch": 18.0,
2630
  "eval_accuracy": 0.8916967509025271,
2631
  "eval_loss": 0.34751203656196594,
2632
+ "eval_runtime": 0.9366,
2633
+ "eval_samples_per_second": 295.765,
2634
+ "eval_steps_per_second": 37.371,
2635
  "step": 3528
2636
  },
2637
  {
 
2778
  "epoch": 19.0,
2779
  "eval_accuracy": 0.8592057761732852,
2780
  "eval_loss": 0.38391339778900146,
2781
+ "eval_runtime": 0.9352,
2782
+ "eval_samples_per_second": 296.2,
2783
+ "eval_steps_per_second": 37.426,
2784
  "step": 3724
2785
  },
2786
  {
 
2927
  "epoch": 20.0,
2928
  "eval_accuracy": 0.9133574007220217,
2929
  "eval_loss": 0.3031846880912781,
2930
+ "eval_runtime": 0.9346,
2931
+ "eval_samples_per_second": 296.374,
2932
+ "eval_steps_per_second": 37.448,
2933
  "step": 3920
2934
  },
2935
  {
 
3069
  "epoch": 21.0,
3070
  "eval_accuracy": 0.851985559566787,
3071
  "eval_loss": 0.4246116876602173,
3072
+ "eval_runtime": 0.9314,
3073
+ "eval_samples_per_second": 297.413,
3074
+ "eval_steps_per_second": 37.579,
3075
  "step": 4116
3076
  },
3077
  {
 
3218
  "epoch": 22.0,
3219
  "eval_accuracy": 0.8989169675090253,
3220
  "eval_loss": 0.29509276151657104,
3221
+ "eval_runtime": 0.9307,
3222
+ "eval_samples_per_second": 297.612,
3223
+ "eval_steps_per_second": 37.604,
3224
  "step": 4312
3225
  },
3226
  {
 
3360
  "epoch": 23.0,
3361
  "eval_accuracy": 0.851985559566787,
3362
  "eval_loss": 0.4356595277786255,
3363
+ "eval_runtime": 0.9603,
3364
+ "eval_samples_per_second": 288.437,
3365
+ "eval_steps_per_second": 36.445,
3366
  "step": 4508
3367
  },
3368
  {
 
3509
  "epoch": 24.0,
3510
  "eval_accuracy": 0.8916967509025271,
3511
  "eval_loss": 0.399036169052124,
3512
+ "eval_runtime": 0.9342,
3513
+ "eval_samples_per_second": 296.5,
3514
+ "eval_steps_per_second": 37.464,
3515
  "step": 4704
3516
  },
3517
  {
 
3658
  "epoch": 25.0,
3659
  "eval_accuracy": 0.9097472924187726,
3660
  "eval_loss": 0.35359257459640503,
3661
+ "eval_runtime": 0.9646,
3662
+ "eval_samples_per_second": 287.175,
3663
+ "eval_steps_per_second": 36.286,
3664
  "step": 4900
3665
  },
3666
  {
 
3800
  "epoch": 26.0,
3801
  "eval_accuracy": 0.8592057761732852,
3802
  "eval_loss": 0.4166140854358673,
3803
+ "eval_runtime": 0.9729,
3804
+ "eval_samples_per_second": 284.728,
3805
+ "eval_steps_per_second": 35.976,
3806
  "step": 5096
3807
  },
3808
  {
 
3949
  "epoch": 27.0,
3950
  "eval_accuracy": 0.851985559566787,
3951
  "eval_loss": 0.4353993237018585,
3952
+ "eval_runtime": 0.9398,
3953
+ "eval_samples_per_second": 294.757,
3954
+ "eval_steps_per_second": 37.244,
3955
  "step": 5292
3956
  },
3957
  {
 
4091
  "epoch": 28.0,
4092
  "eval_accuracy": 0.8592057761732852,
4093
  "eval_loss": 0.4088672697544098,
4094
+ "eval_runtime": 0.9406,
4095
+ "eval_samples_per_second": 294.489,
4096
+ "eval_steps_per_second": 37.21,
4097
  "step": 5488
4098
  },
4099
  {
 
4240
  "epoch": 29.0,
4241
  "eval_accuracy": 0.8231046931407943,
4242
  "eval_loss": 0.4787161946296692,
4243
+ "eval_runtime": 0.933,
4244
+ "eval_samples_per_second": 296.9,
4245
+ "eval_steps_per_second": 37.514,
4246
  "step": 5684
4247
  },
4248
  {
 
4389
  "epoch": 30.0,
4390
  "eval_accuracy": 0.9097472924187726,
4391
  "eval_loss": 0.3165305256843567,
4392
+ "eval_runtime": 0.9292,
4393
+ "eval_samples_per_second": 298.12,
4394
+ "eval_steps_per_second": 37.669,
4395
  "step": 5880
4396
  },
4397
  {
 
4531
  "epoch": 31.0,
4532
  "eval_accuracy": 0.9133574007220217,
4533
  "eval_loss": 0.31053850054740906,
4534
+ "eval_runtime": 0.9345,
4535
+ "eval_samples_per_second": 296.427,
4536
+ "eval_steps_per_second": 37.455,
4537
  "step": 6076
4538
  },
4539
  {
 
4680
  "epoch": 32.0,
4681
  "eval_accuracy": 0.9061371841155235,
4682
  "eval_loss": 0.3559906780719757,
4683
+ "eval_runtime": 0.9353,
4684
+ "eval_samples_per_second": 296.174,
4685
+ "eval_steps_per_second": 37.423,
4686
  "step": 6272
4687
  },
4688
  {
 
4822
  "epoch": 33.0,
4823
  "eval_accuracy": 0.9097472924187726,
4824
  "eval_loss": 0.26566287875175476,
4825
+ "eval_runtime": 0.9334,
4826
+ "eval_samples_per_second": 296.762,
4827
+ "eval_steps_per_second": 37.497,
4828
  "step": 6468
4829
  },
4830
  {
 
4971
  "epoch": 34.0,
4972
  "eval_accuracy": 0.9133574007220217,
4973
  "eval_loss": 0.2679595947265625,
4974
+ "eval_runtime": 0.936,
4975
+ "eval_samples_per_second": 295.944,
4976
+ "eval_steps_per_second": 37.394,
4977
  "step": 6664
4978
  },
4979
  {
 
5120
  "epoch": 35.0,
5121
  "eval_accuracy": 0.9061371841155235,
5122
  "eval_loss": 0.3797638416290283,
5123
+ "eval_runtime": 0.9298,
5124
+ "eval_samples_per_second": 297.901,
5125
+ "eval_steps_per_second": 37.641,
5126
  "step": 6860
5127
  },
5128
  {
 
5262
  "epoch": 36.0,
5263
  "eval_accuracy": 0.855595667870036,
5264
  "eval_loss": 0.5098311305046082,
5265
+ "eval_runtime": 0.9428,
5266
+ "eval_samples_per_second": 293.818,
5267
+ "eval_steps_per_second": 37.125,
5268
  "step": 7056
5269
  },
5270
  {
 
5411
  "epoch": 37.0,
5412
  "eval_accuracy": 0.8808664259927798,
5413
  "eval_loss": 0.42190420627593994,
5414
+ "eval_runtime": 0.9304,
5415
+ "eval_samples_per_second": 297.732,
5416
+ "eval_steps_per_second": 37.62,
5417
  "step": 7252
5418
  },
5419
  {
 
5553
  "epoch": 38.0,
5554
  "eval_accuracy": 0.9133574007220217,
5555
  "eval_loss": 0.2851579189300537,
5556
+ "eval_runtime": 0.9753,
5557
+ "eval_samples_per_second": 284.019,
5558
+ "eval_steps_per_second": 35.887,
5559
  "step": 7448
5560
  },
5561
  {
 
5702
  "epoch": 39.0,
5703
  "eval_accuracy": 0.8989169675090253,
5704
  "eval_loss": 0.36030298471450806,
5705
+ "eval_runtime": 0.9403,
5706
+ "eval_samples_per_second": 294.598,
5707
+ "eval_steps_per_second": 37.224,
5708
  "step": 7644
5709
  },
5710
  {
 
5851
  "epoch": 40.0,
5852
  "eval_accuracy": 0.8736462093862816,
5853
  "eval_loss": 0.351894736289978,
5854
+ "eval_runtime": 0.9415,
5855
+ "eval_samples_per_second": 294.212,
5856
+ "eval_steps_per_second": 37.175,
5857
  "step": 7840
5858
  },
5859
  {
 
5993
  "epoch": 41.0,
5994
  "eval_accuracy": 0.9025270758122743,
5995
  "eval_loss": 0.3343473970890045,
5996
+ "eval_runtime": 0.9379,
5997
+ "eval_samples_per_second": 295.341,
5998
+ "eval_steps_per_second": 37.317,
5999
  "step": 8036
6000
  },
6001
  {
 
6142
  "epoch": 42.0,
6143
  "eval_accuracy": 0.9169675090252708,
6144
  "eval_loss": 0.3383941352367401,
6145
+ "eval_runtime": 0.9348,
6146
+ "eval_samples_per_second": 296.313,
6147
+ "eval_steps_per_second": 37.44,
6148
  "step": 8232
6149
  },
6150
  {
 
6284
  "epoch": 43.0,
6285
  "eval_accuracy": 0.8772563176895307,
6286
  "eval_loss": 0.40458711981773376,
6287
+ "eval_runtime": 0.9383,
6288
+ "eval_samples_per_second": 295.207,
6289
+ "eval_steps_per_second": 37.301,
6290
  "step": 8428
6291
  },
6292
  {
 
6433
  "epoch": 44.0,
6434
  "eval_accuracy": 0.8916967509025271,
6435
  "eval_loss": 0.39525121450424194,
6436
+ "eval_runtime": 0.9341,
6437
+ "eval_samples_per_second": 296.557,
6438
+ "eval_steps_per_second": 37.471,
6439
  "step": 8624
6440
  },
6441
  {
 
6582
  "epoch": 45.0,
6583
  "eval_accuracy": 0.8592057761732852,
6584
  "eval_loss": 0.5002943873405457,
6585
+ "eval_runtime": 0.9313,
6586
+ "eval_samples_per_second": 297.43,
6587
+ "eval_steps_per_second": 37.581,
6588
  "step": 8820
6589
  },
6590
  {
 
6724
  "epoch": 46.0,
6725
  "eval_accuracy": 0.9169675090252708,
6726
  "eval_loss": 0.3231888711452484,
6727
+ "eval_runtime": 0.9353,
6728
+ "eval_samples_per_second": 296.162,
6729
+ "eval_steps_per_second": 37.421,
6730
  "step": 9016
6731
  },
6732
  {
 
6873
  "epoch": 47.0,
6874
  "eval_accuracy": 0.9169675090252708,
6875
  "eval_loss": 0.3112559914588928,
6876
+ "eval_runtime": 0.9287,
6877
+ "eval_samples_per_second": 298.262,
6878
+ "eval_steps_per_second": 37.687,
6879
  "step": 9212
6880
  },
6881
  {
 
7015
  "epoch": 48.0,
7016
  "eval_accuracy": 0.855595667870036,
7017
  "eval_loss": 0.4494384229183197,
7018
+ "eval_runtime": 0.928,
7019
+ "eval_samples_per_second": 298.494,
7020
+ "eval_steps_per_second": 37.716,
7021
  "step": 9408
7022
  },
7023
  {
 
7164
  "epoch": 49.0,
7165
  "eval_accuracy": 0.9205776173285198,
7166
  "eval_loss": 0.37217509746551514,
7167
+ "eval_runtime": 0.9297,
7168
+ "eval_samples_per_second": 297.952,
7169
+ "eval_steps_per_second": 37.647,
7170
  "step": 9604
7171
  },
7172
  {
 
7313
  "epoch": 50.0,
7314
  "eval_accuracy": 0.9097472924187726,
7315
  "eval_loss": 0.2852139472961426,
7316
+ "eval_runtime": 0.9306,
7317
+ "eval_samples_per_second": 297.668,
7318
+ "eval_steps_per_second": 37.611,
7319
  "step": 9800
7320
  },
7321
  {
 
7455
  "epoch": 51.0,
7456
  "eval_accuracy": 0.8628158844765343,
7457
  "eval_loss": 0.4137951135635376,
7458
+ "eval_runtime": 0.9371,
7459
+ "eval_samples_per_second": 295.604,
7460
+ "eval_steps_per_second": 37.351,
7461
  "step": 9996
7462
  },
7463
  {
 
7604
  "epoch": 52.0,
7605
  "eval_accuracy": 0.8953068592057761,
7606
  "eval_loss": 0.34130236506462097,
7607
+ "eval_runtime": 0.9387,
7608
+ "eval_samples_per_second": 295.092,
7609
+ "eval_steps_per_second": 37.286,
7610
  "step": 10192
7611
  },
7612
  {
 
7746
  "epoch": 53.0,
7747
  "eval_accuracy": 0.9169675090252708,
7748
  "eval_loss": 0.30462250113487244,
7749
+ "eval_runtime": 0.9357,
7750
+ "eval_samples_per_second": 296.019,
7751
+ "eval_steps_per_second": 37.403,
7752
  "step": 10388
7753
  },
7754
  {
 
7895
  "epoch": 54.0,
7896
  "eval_accuracy": 0.8989169675090253,
7897
  "eval_loss": 0.2849152684211731,
7898
+ "eval_runtime": 0.9334,
7899
+ "eval_samples_per_second": 296.775,
7900
+ "eval_steps_per_second": 37.499,
7901
  "step": 10584
7902
  },
7903
  {
 
8044
  "epoch": 55.0,
8045
  "eval_accuracy": 0.9133574007220217,
8046
  "eval_loss": 0.35168057680130005,
8047
+ "eval_runtime": 0.9361,
8048
+ "eval_samples_per_second": 295.907,
8049
+ "eval_steps_per_second": 37.389,
8050
  "step": 10780
8051
  },
8052
  {
 
8186
  "epoch": 56.0,
8187
  "eval_accuracy": 0.9025270758122743,
8188
  "eval_loss": 0.45381447672843933,
8189
+ "eval_runtime": 0.9344,
8190
+ "eval_samples_per_second": 296.45,
8191
+ "eval_steps_per_second": 37.458,
8192
  "step": 10976
8193
  },
8194
  {
 
8335
  "epoch": 57.0,
8336
  "eval_accuracy": 0.8592057761732852,
8337
  "eval_loss": 0.44916799664497375,
8338
+ "eval_runtime": 0.9373,
8339
+ "eval_samples_per_second": 295.53,
8340
+ "eval_steps_per_second": 37.341,
8341
  "step": 11172
8342
  },
8343
  {
 
8477
  "epoch": 58.0,
8478
  "eval_accuracy": 0.8628158844765343,
8479
  "eval_loss": 0.4738902747631073,
8480
+ "eval_runtime": 0.9332,
8481
+ "eval_samples_per_second": 296.824,
8482
+ "eval_steps_per_second": 37.505,
8483
  "step": 11368
8484
  },
8485
  {
 
8626
  "epoch": 59.0,
8627
  "eval_accuracy": 0.9205776173285198,
8628
  "eval_loss": 0.2831103205680847,
8629
+ "eval_runtime": 0.9316,
8630
+ "eval_samples_per_second": 297.324,
8631
+ "eval_steps_per_second": 37.568,
8632
  "step": 11564
8633
  },
8634
  {
 
8775
  "epoch": 60.0,
8776
  "eval_accuracy": 0.9205776173285198,
8777
  "eval_loss": 0.34654152393341064,
8778
+ "eval_runtime": 0.9298,
8779
+ "eval_samples_per_second": 297.899,
8780
+ "eval_steps_per_second": 37.641,
8781
  "step": 11760
8782
  },
8783
  {
 
8917
  "epoch": 61.0,
8918
  "eval_accuracy": 0.9314079422382672,
8919
  "eval_loss": 0.28843551874160767,
8920
+ "eval_runtime": 0.938,
8921
+ "eval_samples_per_second": 295.31,
8922
+ "eval_steps_per_second": 37.314,
8923
  "step": 11956
8924
  },
8925
  {
 
9066
  "epoch": 62.0,
9067
  "eval_accuracy": 0.8447653429602888,
9068
  "eval_loss": 0.4874745309352875,
9069
+ "eval_runtime": 0.935,
9070
+ "eval_samples_per_second": 296.251,
9071
+ "eval_steps_per_second": 37.432,
9072
  "step": 12152
9073
  },
9074
  {
 
9208
  "epoch": 63.0,
9209
  "eval_accuracy": 0.9061371841155235,
9210
  "eval_loss": 0.3988655209541321,
9211
+ "eval_runtime": 0.9339,
9212
+ "eval_samples_per_second": 296.617,
9213
+ "eval_steps_per_second": 37.479,
9214
  "step": 12348
9215
  },
9216
  {
 
9357
  "epoch": 64.0,
9358
  "eval_accuracy": 0.851985559566787,
9359
  "eval_loss": 0.5952923893928528,
9360
+ "eval_runtime": 0.9334,
9361
+ "eval_samples_per_second": 296.767,
9362
+ "eval_steps_per_second": 37.498,
9363
  "step": 12544
9364
  },
9365
  {
 
9506
  "epoch": 65.0,
9507
  "eval_accuracy": 0.927797833935018,
9508
  "eval_loss": 0.2953914701938629,
9509
+ "eval_runtime": 0.9948,
9510
+ "eval_samples_per_second": 278.444,
9511
+ "eval_steps_per_second": 35.183,
9512
  "step": 12740
9513
  },
9514
  {
 
9648
  "epoch": 66.0,
9649
  "eval_accuracy": 0.851985559566787,
9650
  "eval_loss": 0.5033073425292969,
9651
+ "eval_runtime": 0.9324,
9652
+ "eval_samples_per_second": 297.09,
9653
+ "eval_steps_per_second": 37.538,
9654
  "step": 12936
9655
  },
9656
  {
 
9797
  "epoch": 67.0,
9798
  "eval_accuracy": 0.8808664259927798,
9799
  "eval_loss": 0.41321179270744324,
9800
+ "eval_runtime": 0.9337,
9801
+ "eval_samples_per_second": 296.681,
9802
+ "eval_steps_per_second": 37.487,
9803
  "step": 13132
9804
  },
9805
  {
 
9939
  "epoch": 68.0,
9940
  "eval_accuracy": 0.9169675090252708,
9941
  "eval_loss": 0.37430626153945923,
9942
+ "eval_runtime": 0.9326,
9943
+ "eval_samples_per_second": 297.033,
9944
+ "eval_steps_per_second": 37.531,
9945
  "step": 13328
9946
  },
9947
  {
 
10088
  "epoch": 69.0,
10089
  "eval_accuracy": 0.776173285198556,
10090
  "eval_loss": 0.6423271298408508,
10091
+ "eval_runtime": 0.9344,
10092
+ "eval_samples_per_second": 296.457,
10093
+ "eval_steps_per_second": 37.458,
10094
  "step": 13524
10095
  },
10096
  {
 
10237
  "epoch": 70.0,
10238
  "eval_accuracy": 0.8014440433212996,
10239
  "eval_loss": 0.5979345440864563,
10240
+ "eval_runtime": 0.9413,
10241
+ "eval_samples_per_second": 294.271,
10242
+ "eval_steps_per_second": 37.182,
10243
  "step": 13720
10244
  },
10245
  {
 
10379
  "epoch": 71.0,
10380
  "eval_accuracy": 0.8989169675090253,
10381
  "eval_loss": 0.43981537222862244,
10382
+ "eval_runtime": 0.9369,
10383
+ "eval_samples_per_second": 295.663,
10384
+ "eval_steps_per_second": 37.358,
10385
  "step": 13916
10386
  },
10387
  {
 
10528
  "epoch": 72.0,
10529
  "eval_accuracy": 0.8231046931407943,
10530
  "eval_loss": 0.5633912086486816,
10531
+ "eval_runtime": 0.9331,
10532
+ "eval_samples_per_second": 296.846,
10533
+ "eval_steps_per_second": 37.508,
10534
  "step": 14112
10535
  },
10536
  {
 
10670
  "epoch": 73.0,
10671
  "eval_accuracy": 0.776173285198556,
10672
  "eval_loss": 0.620398223400116,
10673
+ "eval_runtime": 0.9369,
10674
+ "eval_samples_per_second": 295.645,
10675
+ "eval_steps_per_second": 37.356,
10676
  "step": 14308
10677
  },
10678
  {
 
10819
  "epoch": 74.0,
10820
  "eval_accuracy": 0.8953068592057761,
10821
  "eval_loss": 0.36853671073913574,
10822
+ "eval_runtime": 0.9373,
10823
+ "eval_samples_per_second": 295.515,
10824
+ "eval_steps_per_second": 37.339,
10825
  "step": 14504
10826
  },
10827
  {
 
10968
  "epoch": 75.0,
10969
  "eval_accuracy": 0.8158844765342961,
10970
  "eval_loss": 0.7026161551475525,
10971
+ "eval_runtime": 0.9279,
10972
+ "eval_samples_per_second": 298.519,
10973
+ "eval_steps_per_second": 37.719,
10974
  "step": 14700
10975
  },
10976
  {
 
11110
  "epoch": 76.0,
11111
  "eval_accuracy": 0.9169675090252708,
11112
  "eval_loss": 0.40481600165367126,
11113
+ "eval_runtime": 0.9401,
11114
+ "eval_samples_per_second": 294.635,
11115
+ "eval_steps_per_second": 37.228,
11116
  "step": 14896
11117
  },
11118
  {
 
11259
  "epoch": 77.0,
11260
  "eval_accuracy": 0.8844765342960289,
11261
  "eval_loss": 0.48912858963012695,
11262
+ "eval_runtime": 0.9257,
11263
+ "eval_samples_per_second": 299.23,
11264
+ "eval_steps_per_second": 37.809,
11265
  "step": 15092
11266
  },
11267
  {
 
11401
  "epoch": 78.0,
11402
  "eval_accuracy": 0.8772563176895307,
11403
  "eval_loss": 0.42159637808799744,
11404
+ "eval_runtime": 0.9931,
11405
+ "eval_samples_per_second": 278.916,
11406
+ "eval_steps_per_second": 35.242,
11407
  "step": 15288
11408
  },
11409
  {
 
11550
  "epoch": 79.0,
11551
  "eval_accuracy": 0.8953068592057761,
11552
  "eval_loss": 0.2720978558063507,
11553
+ "eval_runtime": 0.9347,
11554
+ "eval_samples_per_second": 296.358,
11555
+ "eval_steps_per_second": 37.446,
11556
  "step": 15484
11557
  },
11558
  {
 
11699
  "epoch": 80.0,
11700
  "eval_accuracy": 0.8483754512635379,
11701
  "eval_loss": 0.42701977491378784,
11702
+ "eval_runtime": 0.9306,
11703
+ "eval_samples_per_second": 297.657,
11704
+ "eval_steps_per_second": 37.61,
11705
  "step": 15680
11706
  },
11707
  {
 
11841
  "epoch": 81.0,
11842
  "eval_accuracy": 0.7833935018050542,
11843
  "eval_loss": 0.763225793838501,
11844
+ "eval_runtime": 0.9357,
11845
+ "eval_samples_per_second": 296.038,
11846
+ "eval_steps_per_second": 37.405,
11847
  "step": 15876
11848
  },
11849
  {
 
11990
  "epoch": 82.0,
11991
  "eval_accuracy": 0.9025270758122743,
11992
  "eval_loss": 0.3249270021915436,
11993
+ "eval_runtime": 0.9334,
11994
+ "eval_samples_per_second": 296.754,
11995
+ "eval_steps_per_second": 37.496,
11996
  "step": 16072
11997
  },
11998
  {
 
12132
  "epoch": 83.0,
12133
  "eval_accuracy": 0.8989169675090253,
12134
  "eval_loss": 0.38384127616882324,
12135
+ "eval_runtime": 0.9338,
12136
+ "eval_samples_per_second": 296.64,
12137
+ "eval_steps_per_second": 37.482,
12138
  "step": 16268
12139
  },
12140
  {
 
12281
  "epoch": 84.0,
12282
  "eval_accuracy": 0.9205776173285198,
12283
  "eval_loss": 0.3329784572124481,
12284
+ "eval_runtime": 0.9338,
12285
+ "eval_samples_per_second": 296.638,
12286
+ "eval_steps_per_second": 37.481,
12287
  "step": 16464
12288
  },
12289
  {
 
12430
  "epoch": 85.0,
12431
  "eval_accuracy": 0.8700361010830325,
12432
  "eval_loss": 0.32456666231155396,
12433
+ "eval_runtime": 0.9335,
12434
+ "eval_samples_per_second": 296.719,
12435
+ "eval_steps_per_second": 37.492,
12436
  "step": 16660
12437
  },
12438
  {
 
12572
  "epoch": 86.0,
12573
  "eval_accuracy": 0.8736462093862816,
12574
  "eval_loss": 0.3710058927536011,
12575
+ "eval_runtime": 0.9462,
12576
+ "eval_samples_per_second": 292.762,
12577
+ "eval_steps_per_second": 36.992,
12578
  "step": 16856
12579
  },
12580
  {
 
12721
  "epoch": 87.0,
12722
  "eval_accuracy": 0.9061371841155235,
12723
  "eval_loss": 0.33839184045791626,
12724
+ "eval_runtime": 0.9931,
12725
+ "eval_samples_per_second": 278.938,
12726
+ "eval_steps_per_second": 35.245,
12727
  "step": 17052
12728
  },
12729
  {
 
12863
  "epoch": 88.0,
12864
  "eval_accuracy": 0.9097472924187726,
12865
  "eval_loss": 0.3703186511993408,
12866
+ "eval_runtime": 0.9324,
12867
+ "eval_samples_per_second": 297.094,
12868
+ "eval_steps_per_second": 37.539,
12869
  "step": 17248
12870
  },
12871
  {
 
13012
  "epoch": 89.0,
13013
  "eval_accuracy": 0.8592057761732852,
13014
  "eval_loss": 0.5013492703437805,
13015
+ "eval_runtime": 0.9311,
13016
+ "eval_samples_per_second": 297.495,
13017
+ "eval_steps_per_second": 37.59,
13018
  "step": 17444
13019
  },
13020
  {
 
13161
  "epoch": 90.0,
13162
  "eval_accuracy": 0.8989169675090253,
13163
  "eval_loss": 0.3456423580646515,
13164
+ "eval_runtime": 0.9297,
13165
+ "eval_samples_per_second": 297.96,
13166
+ "eval_steps_per_second": 37.648,
13167
  "step": 17640
13168
  },
13169
  {
 
13303
  "epoch": 91.0,
13304
  "eval_accuracy": 0.8880866425992779,
13305
  "eval_loss": 0.3798539340496063,
13306
+ "eval_runtime": 0.9367,
13307
+ "eval_samples_per_second": 295.72,
13308
+ "eval_steps_per_second": 37.365,
13309
  "step": 17836
13310
  },
13311
  {
 
13452
  "epoch": 92.0,
13453
  "eval_accuracy": 0.9061371841155235,
13454
  "eval_loss": 0.32391440868377686,
13455
+ "eval_runtime": 0.9318,
13456
+ "eval_samples_per_second": 297.278,
13457
+ "eval_steps_per_second": 37.562,
13458
  "step": 18032
13459
  },
13460
  {
 
13594
  "epoch": 93.0,
13595
  "eval_accuracy": 0.8989169675090253,
13596
  "eval_loss": 0.4861180782318115,
13597
+ "eval_runtime": 0.9969,
13598
+ "eval_samples_per_second": 277.851,
13599
+ "eval_steps_per_second": 35.107,
13600
  "step": 18228
13601
  },
13602
  {
 
13743
  "epoch": 94.0,
13744
  "eval_accuracy": 0.8736462093862816,
13745
  "eval_loss": 0.4443919062614441,
13746
+ "eval_runtime": 0.9334,
13747
+ "eval_samples_per_second": 296.762,
13748
+ "eval_steps_per_second": 37.497,
13749
  "step": 18424
13750
  },
13751
  {
 
13892
  "epoch": 95.0,
13893
  "eval_accuracy": 0.8844765342960289,
13894
  "eval_loss": 0.3712524473667145,
13895
+ "eval_runtime": 0.9337,
13896
+ "eval_samples_per_second": 296.658,
13897
+ "eval_steps_per_second": 37.484,
13898
  "step": 18620
13899
  },
13900
  {
 
14034
  "epoch": 96.0,
14035
  "eval_accuracy": 0.8303249097472925,
14036
  "eval_loss": 0.427941232919693,
14037
+ "eval_runtime": 0.9388,
14038
+ "eval_samples_per_second": 295.043,
14039
+ "eval_steps_per_second": 37.28,
14040
  "step": 18816
14041
  },
14042
  {
 
14183
  "epoch": 97.0,
14184
  "eval_accuracy": 0.8411552346570397,
14185
  "eval_loss": 0.6587985157966614,
14186
+ "eval_runtime": 0.9391,
14187
+ "eval_samples_per_second": 294.975,
14188
+ "eval_steps_per_second": 37.271,
14189
  "step": 19012
14190
  },
14191
  {
 
14325
  "epoch": 98.0,
14326
  "eval_accuracy": 0.8267148014440433,
14327
  "eval_loss": 0.66323322057724,
14328
+ "eval_runtime": 0.9369,
14329
+ "eval_samples_per_second": 295.657,
14330
+ "eval_steps_per_second": 37.357,
14331
  "step": 19208
14332
  },
14333
  {
 
14474
  "epoch": 99.0,
14475
  "eval_accuracy": 0.8808664259927798,
14476
  "eval_loss": 0.4641692638397217,
14477
+ "eval_runtime": 0.9404,
14478
+ "eval_samples_per_second": 294.555,
14479
+ "eval_steps_per_second": 37.218,
14480
  "step": 19404
14481
  },
14482
  {
 
14623
  "epoch": 100.0,
14624
  "eval_accuracy": 0.8808664259927798,
14625
  "eval_loss": 0.3624129593372345,
14626
+ "eval_runtime": 1.0032,
14627
+ "eval_samples_per_second": 276.121,
14628
+ "eval_steps_per_second": 34.889,
14629
  "step": 19600
14630
  },
14631
  {
 
14633
  "step": 19600,
14634
  "total_flos": 5.678990728814592e+17,
14635
  "train_loss": 0.30055975163317455,
14636
+ "train_runtime": 949.6972,
14637
+ "train_samples_per_second": 164.895,
14638
+ "train_steps_per_second": 20.638
14639
  }
14640
  ],
14641
  "logging_steps": 10,