mmomm25 commited on
Commit
384ab1e
1 Parent(s): 07cff62

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5351ced59e7c85a3fb2f7c177c877ac1785f0eb288bcfa15c371ef575b43f0b
3
  size 343230128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8e25373df5edc238dbf538c9d6b0eeeb1d527cd776721216fef2c7d314232c2
3
  size 343230128
tmp-checkpoint-2229/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2316bdb1deff163ab2930bf8225abb0555747d3664b366ce6dfebcfeacb3622
3
  size 343230128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8e25373df5edc238dbf538c9d6b0eeeb1d527cd776721216fef2c7d314232c2
3
  size 343230128
tmp-checkpoint-2229/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3df57ff553da5450e2fe19f5d0c98c110c6698d31401453cd55874f6eed9654
3
  size 686581178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e972e37b1f13e734ce46b658d36de5f30f061caa4f586079e212207c93fc8dd
3
  size 686581178
tmp-checkpoint-2229/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c08dcbff6a5bd2d0801a11b6843f11bff78dee9b388ac334253c4cb377b9833
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1b00a69c9e2038884d6befb4def6f17cd678049897fe0c09478e144d8dec956
3
  size 14244
tmp-checkpoint-2229/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.2440667599439621,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-crack-detectorVITmain50epochs\\checkpoint-2229",
4
  "epoch": 1.9995514689392242,
5
  "eval_steps": 500,
@@ -11,1373 +11,1373 @@
11
  {
12
  "epoch": 0.01,
13
  "learning_rate": 8.976660682226213e-08,
14
- "loss": 1.3944,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.02,
19
  "learning_rate": 1.7953321364452426e-07,
20
- "loss": 1.3875,
21
  "step": 20
22
  },
23
  {
24
  "epoch": 0.03,
25
  "learning_rate": 2.692998204667864e-07,
26
- "loss": 1.3999,
27
  "step": 30
28
  },
29
  {
30
  "epoch": 0.04,
31
  "learning_rate": 3.590664272890485e-07,
32
- "loss": 1.3915,
33
  "step": 40
34
  },
35
  {
36
  "epoch": 0.04,
37
  "learning_rate": 4.4883303411131064e-07,
38
- "loss": 1.3856,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 0.05,
43
  "learning_rate": 5.385996409335728e-07,
44
- "loss": 1.3912,
45
  "step": 60
46
  },
47
  {
48
  "epoch": 0.06,
49
  "learning_rate": 6.283662477558349e-07,
50
- "loss": 1.3902,
51
  "step": 70
52
  },
53
  {
54
  "epoch": 0.07,
55
  "learning_rate": 7.18132854578097e-07,
56
- "loss": 1.3851,
57
  "step": 80
58
  },
59
  {
60
  "epoch": 0.08,
61
  "learning_rate": 8.078994614003591e-07,
62
- "loss": 1.3755,
63
  "step": 90
64
  },
65
  {
66
  "epoch": 0.09,
67
  "learning_rate": 8.976660682226213e-07,
68
- "loss": 1.3793,
69
  "step": 100
70
  },
71
  {
72
  "epoch": 0.1,
73
  "learning_rate": 9.874326750448833e-07,
74
- "loss": 1.3737,
75
  "step": 110
76
  },
77
  {
78
  "epoch": 0.11,
79
  "learning_rate": 1.0771992818671456e-06,
80
- "loss": 1.3736,
81
  "step": 120
82
  },
83
  {
84
  "epoch": 0.12,
85
  "learning_rate": 1.1669658886894075e-06,
86
- "loss": 1.3678,
87
  "step": 130
88
  },
89
  {
90
  "epoch": 0.13,
91
  "learning_rate": 1.2567324955116697e-06,
92
- "loss": 1.3637,
93
  "step": 140
94
  },
95
  {
96
  "epoch": 0.13,
97
  "learning_rate": 1.3464991023339318e-06,
98
- "loss": 1.357,
99
  "step": 150
100
  },
101
  {
102
  "epoch": 0.14,
103
  "learning_rate": 1.436265709156194e-06,
104
- "loss": 1.3583,
105
  "step": 160
106
  },
107
  {
108
  "epoch": 0.15,
109
  "learning_rate": 1.5260323159784561e-06,
110
- "loss": 1.361,
111
  "step": 170
112
  },
113
  {
114
  "epoch": 0.16,
115
  "learning_rate": 1.6157989228007182e-06,
116
- "loss": 1.3517,
117
  "step": 180
118
  },
119
  {
120
  "epoch": 0.17,
121
  "learning_rate": 1.7055655296229805e-06,
122
- "loss": 1.3543,
123
  "step": 190
124
  },
125
  {
126
  "epoch": 0.18,
127
  "learning_rate": 1.7953321364452425e-06,
128
- "loss": 1.3497,
129
  "step": 200
130
  },
131
  {
132
  "epoch": 0.19,
133
  "learning_rate": 1.8850987432675046e-06,
134
- "loss": 1.3436,
135
  "step": 210
136
  },
137
  {
138
  "epoch": 0.2,
139
  "learning_rate": 1.9748653500897667e-06,
140
- "loss": 1.3304,
141
  "step": 220
142
  },
143
  {
144
  "epoch": 0.21,
145
  "learning_rate": 2.064631956912029e-06,
146
- "loss": 1.3262,
147
  "step": 230
148
  },
149
  {
150
  "epoch": 0.22,
151
  "learning_rate": 2.1543985637342912e-06,
152
- "loss": 1.3209,
153
  "step": 240
154
  },
155
  {
156
  "epoch": 0.22,
157
  "learning_rate": 2.244165170556553e-06,
158
- "loss": 1.3054,
159
  "step": 250
160
  },
161
  {
162
  "epoch": 0.23,
163
  "learning_rate": 2.333931777378815e-06,
164
- "loss": 1.3028,
165
  "step": 260
166
  },
167
  {
168
  "epoch": 0.24,
169
  "learning_rate": 2.423698384201077e-06,
170
- "loss": 1.2939,
171
  "step": 270
172
  },
173
  {
174
  "epoch": 0.25,
175
  "learning_rate": 2.5134649910233395e-06,
176
- "loss": 1.2894,
177
  "step": 280
178
  },
179
  {
180
  "epoch": 0.26,
181
  "learning_rate": 2.6032315978456015e-06,
182
- "loss": 1.2838,
183
  "step": 290
184
  },
185
  {
186
  "epoch": 0.27,
187
  "learning_rate": 2.6929982046678636e-06,
188
- "loss": 1.2625,
189
  "step": 300
190
  },
191
  {
192
  "epoch": 0.28,
193
  "learning_rate": 2.7827648114901257e-06,
194
- "loss": 1.2727,
195
  "step": 310
196
  },
197
  {
198
  "epoch": 0.29,
199
  "learning_rate": 2.872531418312388e-06,
200
- "loss": 1.2398,
201
  "step": 320
202
  },
203
  {
204
  "epoch": 0.3,
205
  "learning_rate": 2.9622980251346502e-06,
206
- "loss": 1.2267,
207
  "step": 330
208
  },
209
  {
210
  "epoch": 0.31,
211
  "learning_rate": 3.0520646319569123e-06,
212
- "loss": 1.2359,
213
  "step": 340
214
  },
215
  {
216
  "epoch": 0.31,
217
  "learning_rate": 3.1418312387791743e-06,
218
- "loss": 1.218,
219
  "step": 350
220
  },
221
  {
222
  "epoch": 0.32,
223
  "learning_rate": 3.2315978456014364e-06,
224
- "loss": 1.1877,
225
  "step": 360
226
  },
227
  {
228
  "epoch": 0.33,
229
  "learning_rate": 3.321364452423698e-06,
230
- "loss": 1.1764,
231
  "step": 370
232
  },
233
  {
234
  "epoch": 0.34,
235
  "learning_rate": 3.411131059245961e-06,
236
- "loss": 1.151,
237
  "step": 380
238
  },
239
  {
240
  "epoch": 0.35,
241
  "learning_rate": 3.500897666068223e-06,
242
- "loss": 1.1334,
243
  "step": 390
244
  },
245
  {
246
  "epoch": 0.36,
247
  "learning_rate": 3.590664272890485e-06,
248
- "loss": 1.1272,
249
  "step": 400
250
  },
251
  {
252
  "epoch": 0.37,
253
  "learning_rate": 3.680430879712747e-06,
254
- "loss": 1.1077,
255
  "step": 410
256
  },
257
  {
258
  "epoch": 0.38,
259
  "learning_rate": 3.770197486535009e-06,
260
- "loss": 1.1021,
261
  "step": 420
262
  },
263
  {
264
  "epoch": 0.39,
265
  "learning_rate": 3.859964093357271e-06,
266
- "loss": 1.0583,
267
  "step": 430
268
  },
269
  {
270
  "epoch": 0.39,
271
  "learning_rate": 3.949730700179533e-06,
272
- "loss": 1.0482,
273
  "step": 440
274
  },
275
  {
276
  "epoch": 0.4,
277
  "learning_rate": 4.039497307001795e-06,
278
- "loss": 1.0214,
279
  "step": 450
280
  },
281
  {
282
  "epoch": 0.41,
283
  "learning_rate": 4.129263913824058e-06,
284
- "loss": 1.0114,
285
  "step": 460
286
  },
287
  {
288
  "epoch": 0.42,
289
  "learning_rate": 4.21903052064632e-06,
290
- "loss": 1.0237,
291
  "step": 470
292
  },
293
  {
294
  "epoch": 0.43,
295
  "learning_rate": 4.3087971274685824e-06,
296
- "loss": 0.969,
297
  "step": 480
298
  },
299
  {
300
  "epoch": 0.44,
301
  "learning_rate": 4.3985637342908445e-06,
302
- "loss": 0.966,
303
  "step": 490
304
  },
305
  {
306
  "epoch": 0.45,
307
  "learning_rate": 4.488330341113106e-06,
308
- "loss": 0.9518,
309
  "step": 500
310
  },
311
  {
312
  "epoch": 0.46,
313
  "learning_rate": 4.578096947935368e-06,
314
- "loss": 0.9545,
315
  "step": 510
316
  },
317
  {
318
  "epoch": 0.47,
319
  "learning_rate": 4.66786355475763e-06,
320
- "loss": 0.9473,
321
  "step": 520
322
  },
323
  {
324
  "epoch": 0.48,
325
  "learning_rate": 4.757630161579892e-06,
326
- "loss": 0.9026,
327
  "step": 530
328
  },
329
  {
330
  "epoch": 0.48,
331
  "learning_rate": 4.847396768402154e-06,
332
- "loss": 0.8535,
333
  "step": 540
334
  },
335
  {
336
  "epoch": 0.49,
337
  "learning_rate": 4.937163375224417e-06,
338
- "loss": 0.8598,
339
  "step": 550
340
  },
341
  {
342
  "epoch": 0.5,
343
  "learning_rate": 5.026929982046679e-06,
344
- "loss": 0.8154,
345
  "step": 560
346
  },
347
  {
348
  "epoch": 0.51,
349
  "learning_rate": 5.116696588868941e-06,
350
- "loss": 0.8561,
351
  "step": 570
352
  },
353
  {
354
  "epoch": 0.52,
355
  "learning_rate": 5.206463195691203e-06,
356
- "loss": 0.7924,
357
  "step": 580
358
  },
359
  {
360
  "epoch": 0.53,
361
  "learning_rate": 5.296229802513465e-06,
362
- "loss": 0.7947,
363
  "step": 590
364
  },
365
  {
366
  "epoch": 0.54,
367
  "learning_rate": 5.385996409335727e-06,
368
- "loss": 0.7999,
369
  "step": 600
370
  },
371
  {
372
  "epoch": 0.55,
373
  "learning_rate": 5.475763016157989e-06,
374
- "loss": 0.7771,
375
  "step": 610
376
  },
377
  {
378
  "epoch": 0.56,
379
  "learning_rate": 5.565529622980251e-06,
380
- "loss": 0.7826,
381
  "step": 620
382
  },
383
  {
384
  "epoch": 0.57,
385
  "learning_rate": 5.655296229802514e-06,
386
- "loss": 0.7321,
387
  "step": 630
388
  },
389
  {
390
  "epoch": 0.57,
391
  "learning_rate": 5.745062836624776e-06,
392
- "loss": 0.7689,
393
  "step": 640
394
  },
395
  {
396
  "epoch": 0.58,
397
  "learning_rate": 5.834829443447038e-06,
398
- "loss": 0.7546,
399
  "step": 650
400
  },
401
  {
402
  "epoch": 0.59,
403
  "learning_rate": 5.9245960502693004e-06,
404
- "loss": 0.7336,
405
  "step": 660
406
  },
407
  {
408
  "epoch": 0.6,
409
  "learning_rate": 6.0143626570915625e-06,
410
- "loss": 0.6889,
411
  "step": 670
412
  },
413
  {
414
  "epoch": 0.61,
415
  "learning_rate": 6.1041292639138246e-06,
416
- "loss": 0.6996,
417
  "step": 680
418
  },
419
  {
420
  "epoch": 0.62,
421
  "learning_rate": 6.193895870736087e-06,
422
- "loss": 0.6994,
423
  "step": 690
424
  },
425
  {
426
  "epoch": 0.63,
427
  "learning_rate": 6.283662477558349e-06,
428
- "loss": 0.74,
429
  "step": 700
430
  },
431
  {
432
  "epoch": 0.64,
433
  "learning_rate": 6.373429084380611e-06,
434
- "loss": 0.711,
435
  "step": 710
436
  },
437
  {
438
  "epoch": 0.65,
439
  "learning_rate": 6.463195691202873e-06,
440
- "loss": 0.6765,
441
  "step": 720
442
  },
443
  {
444
  "epoch": 0.65,
445
  "learning_rate": 6.552962298025135e-06,
446
- "loss": 0.6717,
447
  "step": 730
448
  },
449
  {
450
  "epoch": 0.66,
451
  "learning_rate": 6.642728904847396e-06,
452
- "loss": 0.6776,
453
  "step": 740
454
  },
455
  {
456
  "epoch": 0.67,
457
  "learning_rate": 6.732495511669659e-06,
458
- "loss": 0.62,
459
  "step": 750
460
  },
461
  {
462
  "epoch": 0.68,
463
  "learning_rate": 6.822262118491922e-06,
464
- "loss": 0.6392,
465
  "step": 760
466
  },
467
  {
468
  "epoch": 0.69,
469
  "learning_rate": 6.912028725314183e-06,
470
- "loss": 0.62,
471
  "step": 770
472
  },
473
  {
474
  "epoch": 0.7,
475
  "learning_rate": 7.001795332136446e-06,
476
- "loss": 0.6103,
477
  "step": 780
478
  },
479
  {
480
  "epoch": 0.71,
481
  "learning_rate": 7.091561938958707e-06,
482
- "loss": 0.6504,
483
  "step": 790
484
  },
485
  {
486
  "epoch": 0.72,
487
  "learning_rate": 7.18132854578097e-06,
488
- "loss": 0.6126,
489
  "step": 800
490
  },
491
  {
492
  "epoch": 0.73,
493
  "learning_rate": 7.271095152603231e-06,
494
- "loss": 0.5707,
495
  "step": 810
496
  },
497
  {
498
  "epoch": 0.74,
499
  "learning_rate": 7.360861759425494e-06,
500
- "loss": 0.587,
501
  "step": 820
502
  },
503
  {
504
  "epoch": 0.74,
505
  "learning_rate": 7.4506283662477555e-06,
506
- "loss": 0.5684,
507
  "step": 830
508
  },
509
  {
510
  "epoch": 0.75,
511
  "learning_rate": 7.540394973070018e-06,
512
- "loss": 0.5586,
513
  "step": 840
514
  },
515
  {
516
  "epoch": 0.76,
517
  "learning_rate": 7.630161579892281e-06,
518
- "loss": 0.6074,
519
  "step": 850
520
  },
521
  {
522
  "epoch": 0.77,
523
  "learning_rate": 7.719928186714543e-06,
524
- "loss": 0.5638,
525
  "step": 860
526
  },
527
  {
528
  "epoch": 0.78,
529
  "learning_rate": 7.809694793536805e-06,
530
- "loss": 0.5952,
531
  "step": 870
532
  },
533
  {
534
  "epoch": 0.79,
535
  "learning_rate": 7.899461400359067e-06,
536
- "loss": 0.5647,
537
  "step": 880
538
  },
539
  {
540
  "epoch": 0.8,
541
  "learning_rate": 7.98922800718133e-06,
542
- "loss": 0.6049,
543
  "step": 890
544
  },
545
  {
546
  "epoch": 0.81,
547
  "learning_rate": 8.07899461400359e-06,
548
- "loss": 0.5525,
549
  "step": 900
550
  },
551
  {
552
  "epoch": 0.82,
553
  "learning_rate": 8.168761220825854e-06,
554
- "loss": 0.522,
555
  "step": 910
556
  },
557
  {
558
  "epoch": 0.83,
559
  "learning_rate": 8.258527827648117e-06,
560
- "loss": 0.5489,
561
  "step": 920
562
  },
563
  {
564
  "epoch": 0.83,
565
  "learning_rate": 8.348294434470378e-06,
566
- "loss": 0.5394,
567
  "step": 930
568
  },
569
  {
570
  "epoch": 0.84,
571
  "learning_rate": 8.43806104129264e-06,
572
- "loss": 0.5707,
573
  "step": 940
574
  },
575
  {
576
  "epoch": 0.85,
577
  "learning_rate": 8.527827648114902e-06,
578
- "loss": 0.5322,
579
  "step": 950
580
  },
581
  {
582
  "epoch": 0.86,
583
  "learning_rate": 8.617594254937165e-06,
584
- "loss": 0.5637,
585
  "step": 960
586
  },
587
  {
588
  "epoch": 0.87,
589
  "learning_rate": 8.707360861759426e-06,
590
- "loss": 0.529,
591
  "step": 970
592
  },
593
  {
594
  "epoch": 0.88,
595
  "learning_rate": 8.797127468581689e-06,
596
- "loss": 0.51,
597
  "step": 980
598
  },
599
  {
600
  "epoch": 0.89,
601
  "learning_rate": 8.88689407540395e-06,
602
- "loss": 0.4844,
603
  "step": 990
604
  },
605
  {
606
  "epoch": 0.9,
607
  "learning_rate": 8.976660682226211e-06,
608
- "loss": 0.5349,
609
  "step": 1000
610
  },
611
  {
612
  "epoch": 0.91,
613
  "learning_rate": 9.066427289048474e-06,
614
- "loss": 0.5377,
615
  "step": 1010
616
  },
617
  {
618
  "epoch": 0.92,
619
  "learning_rate": 9.156193895870736e-06,
620
- "loss": 0.4985,
621
  "step": 1020
622
  },
623
  {
624
  "epoch": 0.92,
625
  "learning_rate": 9.245960502692998e-06,
626
- "loss": 0.5533,
627
  "step": 1030
628
  },
629
  {
630
  "epoch": 0.93,
631
  "learning_rate": 9.33572710951526e-06,
632
- "loss": 0.4955,
633
  "step": 1040
634
  },
635
  {
636
  "epoch": 0.94,
637
  "learning_rate": 9.425493716337523e-06,
638
- "loss": 0.541,
639
  "step": 1050
640
  },
641
  {
642
  "epoch": 0.95,
643
  "learning_rate": 9.515260323159784e-06,
644
- "loss": 0.4757,
645
  "step": 1060
646
  },
647
  {
648
  "epoch": 0.96,
649
  "learning_rate": 9.605026929982047e-06,
650
- "loss": 0.5478,
651
  "step": 1070
652
  },
653
  {
654
  "epoch": 0.97,
655
  "learning_rate": 9.694793536804308e-06,
656
- "loss": 0.5281,
657
  "step": 1080
658
  },
659
  {
660
  "epoch": 0.98,
661
  "learning_rate": 9.784560143626571e-06,
662
- "loss": 0.5187,
663
  "step": 1090
664
  },
665
  {
666
  "epoch": 0.99,
667
  "learning_rate": 9.874326750448834e-06,
668
- "loss": 0.4591,
669
  "step": 1100
670
  },
671
  {
672
  "epoch": 1.0,
673
  "learning_rate": 9.964093357271095e-06,
674
- "loss": 0.5344,
675
  "step": 1110
676
  },
677
  {
678
  "epoch": 1.0,
679
  "eval_accuracy": {
680
- "accuracy": 0.8744113029827315
681
  },
682
  "eval_f1": {
683
- "f1": 0.8645201833830978
684
  },
685
- "eval_loss": 0.40481075644493103,
686
  "eval_precision": {
687
- "precision": 0.8668175457367389
688
  },
689
  "eval_recall": {
690
- "recall": 0.8631211355155497
691
  },
692
- "eval_runtime": 243.6123,
693
- "eval_samples_per_second": 73.215,
694
- "eval_steps_per_second": 4.577,
695
  "step": 1114
696
  },
697
  {
698
  "epoch": 1.0,
699
  "learning_rate": 1.0053859964093358e-05,
700
- "loss": 0.5092,
701
  "step": 1120
702
  },
703
  {
704
  "epoch": 1.01,
705
  "learning_rate": 1.0143626570915619e-05,
706
- "loss": 0.4834,
707
  "step": 1130
708
  },
709
  {
710
  "epoch": 1.02,
711
  "learning_rate": 1.0233393177737882e-05,
712
- "loss": 0.5403,
713
  "step": 1140
714
  },
715
  {
716
  "epoch": 1.03,
717
  "learning_rate": 1.0323159784560143e-05,
718
- "loss": 0.5109,
719
  "step": 1150
720
  },
721
  {
722
  "epoch": 1.04,
723
  "learning_rate": 1.0412926391382406e-05,
724
- "loss": 0.5002,
725
  "step": 1160
726
  },
727
  {
728
  "epoch": 1.05,
729
  "learning_rate": 1.0502692998204669e-05,
730
- "loss": 0.5052,
731
  "step": 1170
732
  },
733
  {
734
  "epoch": 1.06,
735
  "learning_rate": 1.059245960502693e-05,
736
- "loss": 0.4642,
737
  "step": 1180
738
  },
739
  {
740
  "epoch": 1.07,
741
  "learning_rate": 1.0682226211849193e-05,
742
- "loss": 0.4479,
743
  "step": 1190
744
  },
745
  {
746
  "epoch": 1.08,
747
  "learning_rate": 1.0771992818671454e-05,
748
- "loss": 0.4944,
749
  "step": 1200
750
  },
751
  {
752
  "epoch": 1.09,
753
  "learning_rate": 1.0861759425493717e-05,
754
- "loss": 0.4583,
755
  "step": 1210
756
  },
757
  {
758
  "epoch": 1.09,
759
  "learning_rate": 1.0951526032315979e-05,
760
- "loss": 0.4779,
761
  "step": 1220
762
  },
763
  {
764
  "epoch": 1.1,
765
  "learning_rate": 1.1041292639138241e-05,
766
- "loss": 0.5038,
767
  "step": 1230
768
  },
769
  {
770
  "epoch": 1.11,
771
  "learning_rate": 1.1131059245960503e-05,
772
- "loss": 0.4831,
773
  "step": 1240
774
  },
775
  {
776
  "epoch": 1.12,
777
  "learning_rate": 1.1220825852782766e-05,
778
- "loss": 0.4999,
779
  "step": 1250
780
  },
781
  {
782
  "epoch": 1.13,
783
  "learning_rate": 1.1310592459605028e-05,
784
- "loss": 0.4611,
785
  "step": 1260
786
  },
787
  {
788
  "epoch": 1.14,
789
  "learning_rate": 1.140035906642729e-05,
790
- "loss": 0.4775,
791
  "step": 1270
792
  },
793
  {
794
  "epoch": 1.15,
795
  "learning_rate": 1.1490125673249553e-05,
796
- "loss": 0.4388,
797
  "step": 1280
798
  },
799
  {
800
  "epoch": 1.16,
801
  "learning_rate": 1.1579892280071814e-05,
802
- "loss": 0.4374,
803
  "step": 1290
804
  },
805
  {
806
  "epoch": 1.17,
807
  "learning_rate": 1.1669658886894077e-05,
808
- "loss": 0.4608,
809
  "step": 1300
810
  },
811
  {
812
  "epoch": 1.18,
813
  "learning_rate": 1.1759425493716338e-05,
814
- "loss": 0.4973,
815
  "step": 1310
816
  },
817
  {
818
  "epoch": 1.18,
819
  "learning_rate": 1.1849192100538601e-05,
820
- "loss": 0.4387,
821
  "step": 1320
822
  },
823
  {
824
  "epoch": 1.19,
825
  "learning_rate": 1.1938958707360862e-05,
826
- "loss": 0.4617,
827
  "step": 1330
828
  },
829
  {
830
  "epoch": 1.2,
831
  "learning_rate": 1.2028725314183125e-05,
832
- "loss": 0.4631,
833
  "step": 1340
834
  },
835
  {
836
  "epoch": 1.21,
837
  "learning_rate": 1.2118491921005388e-05,
838
- "loss": 0.4869,
839
  "step": 1350
840
  },
841
  {
842
  "epoch": 1.22,
843
  "learning_rate": 1.2208258527827649e-05,
844
- "loss": 0.4699,
845
  "step": 1360
846
  },
847
  {
848
  "epoch": 1.23,
849
  "learning_rate": 1.2298025134649912e-05,
850
- "loss": 0.482,
851
  "step": 1370
852
  },
853
  {
854
  "epoch": 1.24,
855
  "learning_rate": 1.2387791741472173e-05,
856
- "loss": 0.4067,
857
  "step": 1380
858
  },
859
  {
860
  "epoch": 1.25,
861
  "learning_rate": 1.2477558348294434e-05,
862
- "loss": 0.4218,
863
  "step": 1390
864
  },
865
  {
866
  "epoch": 1.26,
867
  "learning_rate": 1.2567324955116697e-05,
868
- "loss": 0.4643,
869
  "step": 1400
870
  },
871
  {
872
  "epoch": 1.26,
873
  "learning_rate": 1.2657091561938959e-05,
874
- "loss": 0.4317,
875
  "step": 1410
876
  },
877
  {
878
  "epoch": 1.27,
879
  "learning_rate": 1.2746858168761221e-05,
880
- "loss": 0.4303,
881
  "step": 1420
882
  },
883
  {
884
  "epoch": 1.28,
885
  "learning_rate": 1.2836624775583483e-05,
886
- "loss": 0.4247,
887
  "step": 1430
888
  },
889
  {
890
  "epoch": 1.29,
891
  "learning_rate": 1.2926391382405746e-05,
892
- "loss": 0.4553,
893
  "step": 1440
894
  },
895
  {
896
  "epoch": 1.3,
897
  "learning_rate": 1.3016157989228009e-05,
898
- "loss": 0.4527,
899
  "step": 1450
900
  },
901
  {
902
  "epoch": 1.31,
903
  "learning_rate": 1.310592459605027e-05,
904
- "loss": 0.4216,
905
  "step": 1460
906
  },
907
  {
908
  "epoch": 1.32,
909
  "learning_rate": 1.3195691202872531e-05,
910
- "loss": 0.4481,
911
  "step": 1470
912
  },
913
  {
914
  "epoch": 1.33,
915
  "learning_rate": 1.3285457809694792e-05,
916
- "loss": 0.3926,
917
  "step": 1480
918
  },
919
  {
920
  "epoch": 1.34,
921
  "learning_rate": 1.3375224416517057e-05,
922
- "loss": 0.4644,
923
  "step": 1490
924
  },
925
  {
926
  "epoch": 1.35,
927
  "learning_rate": 1.3464991023339318e-05,
928
- "loss": 0.4156,
929
  "step": 1500
930
  },
931
  {
932
  "epoch": 1.35,
933
  "learning_rate": 1.355475763016158e-05,
934
- "loss": 0.4165,
935
  "step": 1510
936
  },
937
  {
938
  "epoch": 1.36,
939
  "learning_rate": 1.3644524236983844e-05,
940
- "loss": 0.427,
941
  "step": 1520
942
  },
943
  {
944
  "epoch": 1.37,
945
  "learning_rate": 1.3734290843806105e-05,
946
- "loss": 0.4229,
947
  "step": 1530
948
  },
949
  {
950
  "epoch": 1.38,
951
  "learning_rate": 1.3824057450628366e-05,
952
- "loss": 0.3961,
953
  "step": 1540
954
  },
955
  {
956
  "epoch": 1.39,
957
  "learning_rate": 1.3913824057450627e-05,
958
- "loss": 0.4438,
959
  "step": 1550
960
  },
961
  {
962
  "epoch": 1.4,
963
  "learning_rate": 1.4003590664272892e-05,
964
- "loss": 0.4037,
965
  "step": 1560
966
  },
967
  {
968
  "epoch": 1.41,
969
  "learning_rate": 1.4093357271095153e-05,
970
- "loss": 0.4341,
971
  "step": 1570
972
  },
973
  {
974
  "epoch": 1.42,
975
  "learning_rate": 1.4183123877917415e-05,
976
- "loss": 0.3715,
977
  "step": 1580
978
  },
979
  {
980
  "epoch": 1.43,
981
  "learning_rate": 1.4272890484739679e-05,
982
- "loss": 0.4292,
983
  "step": 1590
984
  },
985
  {
986
  "epoch": 1.44,
987
  "learning_rate": 1.436265709156194e-05,
988
- "loss": 0.4539,
989
  "step": 1600
990
  },
991
  {
992
  "epoch": 1.44,
993
  "learning_rate": 1.4452423698384202e-05,
994
- "loss": 0.409,
995
  "step": 1610
996
  },
997
  {
998
  "epoch": 1.45,
999
  "learning_rate": 1.4542190305206463e-05,
1000
- "loss": 0.4473,
1001
  "step": 1620
1002
  },
1003
  {
1004
  "epoch": 1.46,
1005
  "learning_rate": 1.4631956912028727e-05,
1006
- "loss": 0.4202,
1007
  "step": 1630
1008
  },
1009
  {
1010
  "epoch": 1.47,
1011
  "learning_rate": 1.4721723518850989e-05,
1012
- "loss": 0.3701,
1013
  "step": 1640
1014
  },
1015
  {
1016
  "epoch": 1.48,
1017
  "learning_rate": 1.481149012567325e-05,
1018
- "loss": 0.4451,
1019
  "step": 1650
1020
  },
1021
  {
1022
  "epoch": 1.49,
1023
  "learning_rate": 1.4901256732495511e-05,
1024
- "loss": 0.4216,
1025
  "step": 1660
1026
  },
1027
  {
1028
  "epoch": 1.5,
1029
  "learning_rate": 1.4991023339317776e-05,
1030
- "loss": 0.4116,
1031
  "step": 1670
1032
  },
1033
  {
1034
  "epoch": 1.51,
1035
  "learning_rate": 1.5080789946140037e-05,
1036
- "loss": 0.4006,
1037
  "step": 1680
1038
  },
1039
  {
1040
  "epoch": 1.52,
1041
  "learning_rate": 1.5170556552962298e-05,
1042
- "loss": 0.4303,
1043
  "step": 1690
1044
  },
1045
  {
1046
  "epoch": 1.53,
1047
  "learning_rate": 1.5260323159784563e-05,
1048
- "loss": 0.441,
1049
  "step": 1700
1050
  },
1051
  {
1052
  "epoch": 1.53,
1053
  "learning_rate": 1.5350089766606824e-05,
1054
- "loss": 0.4248,
1055
  "step": 1710
1056
  },
1057
  {
1058
  "epoch": 1.54,
1059
  "learning_rate": 1.5439856373429085e-05,
1060
- "loss": 0.3771,
1061
  "step": 1720
1062
  },
1063
  {
1064
  "epoch": 1.55,
1065
  "learning_rate": 1.5529622980251346e-05,
1066
- "loss": 0.4158,
1067
  "step": 1730
1068
  },
1069
  {
1070
  "epoch": 1.56,
1071
  "learning_rate": 1.561938958707361e-05,
1072
- "loss": 0.3815,
1073
  "step": 1740
1074
  },
1075
  {
1076
  "epoch": 1.57,
1077
  "learning_rate": 1.5709156193895872e-05,
1078
- "loss": 0.4204,
1079
  "step": 1750
1080
  },
1081
  {
1082
  "epoch": 1.58,
1083
  "learning_rate": 1.5798922800718133e-05,
1084
- "loss": 0.4886,
1085
  "step": 1760
1086
  },
1087
  {
1088
  "epoch": 1.59,
1089
  "learning_rate": 1.5888689407540398e-05,
1090
- "loss": 0.4382,
1091
  "step": 1770
1092
  },
1093
  {
1094
  "epoch": 1.6,
1095
  "learning_rate": 1.597845601436266e-05,
1096
- "loss": 0.4502,
1097
  "step": 1780
1098
  },
1099
  {
1100
  "epoch": 1.61,
1101
  "learning_rate": 1.606822262118492e-05,
1102
- "loss": 0.4155,
1103
  "step": 1790
1104
  },
1105
  {
1106
  "epoch": 1.61,
1107
  "learning_rate": 1.615798922800718e-05,
1108
- "loss": 0.3801,
1109
  "step": 1800
1110
  },
1111
  {
1112
  "epoch": 1.62,
1113
  "learning_rate": 1.6247755834829446e-05,
1114
- "loss": 0.3968,
1115
  "step": 1810
1116
  },
1117
  {
1118
  "epoch": 1.63,
1119
  "learning_rate": 1.6337522441651707e-05,
1120
- "loss": 0.365,
1121
  "step": 1820
1122
  },
1123
  {
1124
  "epoch": 1.64,
1125
  "learning_rate": 1.642728904847397e-05,
1126
- "loss": 0.3638,
1127
  "step": 1830
1128
  },
1129
  {
1130
  "epoch": 1.65,
1131
  "learning_rate": 1.6517055655296233e-05,
1132
- "loss": 0.3935,
1133
  "step": 1840
1134
  },
1135
  {
1136
  "epoch": 1.66,
1137
  "learning_rate": 1.6606822262118494e-05,
1138
- "loss": 0.4092,
1139
  "step": 1850
1140
  },
1141
  {
1142
  "epoch": 1.67,
1143
  "learning_rate": 1.6696588868940756e-05,
1144
- "loss": 0.3617,
1145
  "step": 1860
1146
  },
1147
  {
1148
  "epoch": 1.68,
1149
  "learning_rate": 1.6786355475763017e-05,
1150
- "loss": 0.389,
1151
  "step": 1870
1152
  },
1153
  {
1154
  "epoch": 1.69,
1155
  "learning_rate": 1.687612208258528e-05,
1156
- "loss": 0.3357,
1157
  "step": 1880
1158
  },
1159
  {
1160
  "epoch": 1.7,
1161
  "learning_rate": 1.6965888689407543e-05,
1162
- "loss": 0.3925,
1163
  "step": 1890
1164
  },
1165
  {
1166
  "epoch": 1.7,
1167
  "learning_rate": 1.7055655296229804e-05,
1168
- "loss": 0.4186,
1169
  "step": 1900
1170
  },
1171
  {
1172
  "epoch": 1.71,
1173
  "learning_rate": 1.7145421903052065e-05,
1174
- "loss": 0.3913,
1175
  "step": 1910
1176
  },
1177
  {
1178
  "epoch": 1.72,
1179
  "learning_rate": 1.723518850987433e-05,
1180
- "loss": 0.3679,
1181
  "step": 1920
1182
  },
1183
  {
1184
  "epoch": 1.73,
1185
  "learning_rate": 1.732495511669659e-05,
1186
- "loss": 0.4476,
1187
  "step": 1930
1188
  },
1189
  {
1190
  "epoch": 1.74,
1191
  "learning_rate": 1.7414721723518852e-05,
1192
- "loss": 0.4065,
1193
  "step": 1940
1194
  },
1195
  {
1196
  "epoch": 1.75,
1197
  "learning_rate": 1.7504488330341113e-05,
1198
- "loss": 0.4079,
1199
  "step": 1950
1200
  },
1201
  {
1202
  "epoch": 1.76,
1203
  "learning_rate": 1.7594254937163378e-05,
1204
- "loss": 0.3831,
1205
  "step": 1960
1206
  },
1207
  {
1208
  "epoch": 1.77,
1209
  "learning_rate": 1.768402154398564e-05,
1210
- "loss": 0.3985,
1211
  "step": 1970
1212
  },
1213
  {
1214
  "epoch": 1.78,
1215
  "learning_rate": 1.77737881508079e-05,
1216
- "loss": 0.3705,
1217
  "step": 1980
1218
  },
1219
  {
1220
  "epoch": 1.79,
1221
  "learning_rate": 1.786355475763016e-05,
1222
- "loss": 0.3742,
1223
  "step": 1990
1224
  },
1225
  {
1226
  "epoch": 1.79,
1227
  "learning_rate": 1.7953321364452423e-05,
1228
- "loss": 0.3517,
1229
  "step": 2000
1230
  },
1231
  {
1232
  "epoch": 1.8,
1233
  "learning_rate": 1.8043087971274687e-05,
1234
- "loss": 0.3871,
1235
  "step": 2010
1236
  },
1237
  {
1238
  "epoch": 1.81,
1239
  "learning_rate": 1.813285457809695e-05,
1240
- "loss": 0.3416,
1241
  "step": 2020
1242
  },
1243
  {
1244
  "epoch": 1.82,
1245
  "learning_rate": 1.822262118491921e-05,
1246
- "loss": 0.3856,
1247
  "step": 2030
1248
  },
1249
  {
1250
  "epoch": 1.83,
1251
  "learning_rate": 1.831238779174147e-05,
1252
- "loss": 0.4245,
1253
  "step": 2040
1254
  },
1255
  {
1256
  "epoch": 1.84,
1257
  "learning_rate": 1.8402154398563732e-05,
1258
- "loss": 0.3645,
1259
  "step": 2050
1260
  },
1261
  {
1262
  "epoch": 1.85,
1263
  "learning_rate": 1.8491921005385997e-05,
1264
- "loss": 0.3505,
1265
  "step": 2060
1266
  },
1267
  {
1268
  "epoch": 1.86,
1269
  "learning_rate": 1.8581687612208258e-05,
1270
- "loss": 0.3746,
1271
  "step": 2070
1272
  },
1273
  {
1274
  "epoch": 1.87,
1275
  "learning_rate": 1.867145421903052e-05,
1276
- "loss": 0.352,
1277
  "step": 2080
1278
  },
1279
  {
1280
  "epoch": 1.87,
1281
  "learning_rate": 1.8761220825852784e-05,
1282
- "loss": 0.4295,
1283
  "step": 2090
1284
  },
1285
  {
1286
  "epoch": 1.88,
1287
  "learning_rate": 1.8850987432675045e-05,
1288
- "loss": 0.387,
1289
  "step": 2100
1290
  },
1291
  {
1292
  "epoch": 1.89,
1293
  "learning_rate": 1.8940754039497306e-05,
1294
- "loss": 0.4056,
1295
  "step": 2110
1296
  },
1297
  {
1298
  "epoch": 1.9,
1299
  "learning_rate": 1.9030520646319568e-05,
1300
- "loss": 0.3913,
1301
  "step": 2120
1302
  },
1303
  {
1304
  "epoch": 1.91,
1305
  "learning_rate": 1.9120287253141832e-05,
1306
- "loss": 0.3789,
1307
  "step": 2130
1308
  },
1309
  {
1310
  "epoch": 1.92,
1311
  "learning_rate": 1.9210053859964093e-05,
1312
- "loss": 0.3688,
1313
  "step": 2140
1314
  },
1315
  {
1316
  "epoch": 1.93,
1317
  "learning_rate": 1.9299820466786355e-05,
1318
- "loss": 0.3499,
1319
  "step": 2150
1320
  },
1321
  {
1322
  "epoch": 1.94,
1323
  "learning_rate": 1.9389587073608616e-05,
1324
- "loss": 0.3153,
1325
  "step": 2160
1326
  },
1327
  {
1328
  "epoch": 1.95,
1329
  "learning_rate": 1.947935368043088e-05,
1330
- "loss": 0.3558,
1331
  "step": 2170
1332
  },
1333
  {
1334
  "epoch": 1.96,
1335
  "learning_rate": 1.9569120287253142e-05,
1336
- "loss": 0.3001,
1337
  "step": 2180
1338
  },
1339
  {
1340
  "epoch": 1.96,
1341
  "learning_rate": 1.9658886894075403e-05,
1342
- "loss": 0.3109,
1343
  "step": 2190
1344
  },
1345
  {
1346
  "epoch": 1.97,
1347
  "learning_rate": 1.9748653500897668e-05,
1348
- "loss": 0.3377,
1349
  "step": 2200
1350
  },
1351
  {
1352
  "epoch": 1.98,
1353
  "learning_rate": 1.983842010771993e-05,
1354
- "loss": 0.3888,
1355
  "step": 2210
1356
  },
1357
  {
1358
  "epoch": 1.99,
1359
  "learning_rate": 1.992818671454219e-05,
1360
- "loss": 0.3536,
1361
  "step": 2220
1362
  },
1363
  {
1364
  "epoch": 2.0,
1365
  "eval_accuracy": {
1366
- "accuracy": 0.9219555954249832
1367
  },
1368
  "eval_f1": {
1369
- "f1": 0.9164276462698699
1370
  },
1371
- "eval_loss": 0.2440667599439621,
1372
  "eval_precision": {
1373
- "precision": 0.9196643633917082
1374
  },
1375
  "eval_recall": {
1376
- "recall": 0.913748377704386
1377
  },
1378
- "eval_runtime": 164.5475,
1379
- "eval_samples_per_second": 108.394,
1380
- "eval_steps_per_second": 6.776,
1381
  "step": 2229
1382
  }
1383
  ],
 
1
  {
2
+ "best_metric": 0.2492757886648178,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-crack-detectorVITmain50epochs\\checkpoint-2229",
4
  "epoch": 1.9995514689392242,
5
  "eval_steps": 500,
 
11
  {
12
  "epoch": 0.01,
13
  "learning_rate": 8.976660682226213e-08,
14
+ "loss": 1.3961,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.02,
19
  "learning_rate": 1.7953321364452426e-07,
20
+ "loss": 1.395,
21
  "step": 20
22
  },
23
  {
24
  "epoch": 0.03,
25
  "learning_rate": 2.692998204667864e-07,
26
+ "loss": 1.3978,
27
  "step": 30
28
  },
29
  {
30
  "epoch": 0.04,
31
  "learning_rate": 3.590664272890485e-07,
32
+ "loss": 1.3963,
33
  "step": 40
34
  },
35
  {
36
  "epoch": 0.04,
37
  "learning_rate": 4.4883303411131064e-07,
38
+ "loss": 1.3907,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 0.05,
43
  "learning_rate": 5.385996409335728e-07,
44
+ "loss": 1.396,
45
  "step": 60
46
  },
47
  {
48
  "epoch": 0.06,
49
  "learning_rate": 6.283662477558349e-07,
50
+ "loss": 1.3885,
51
  "step": 70
52
  },
53
  {
54
  "epoch": 0.07,
55
  "learning_rate": 7.18132854578097e-07,
56
+ "loss": 1.387,
57
  "step": 80
58
  },
59
  {
60
  "epoch": 0.08,
61
  "learning_rate": 8.078994614003591e-07,
62
+ "loss": 1.3894,
63
  "step": 90
64
  },
65
  {
66
  "epoch": 0.09,
67
  "learning_rate": 8.976660682226213e-07,
68
+ "loss": 1.3806,
69
  "step": 100
70
  },
71
  {
72
  "epoch": 0.1,
73
  "learning_rate": 9.874326750448833e-07,
74
+ "loss": 1.383,
75
  "step": 110
76
  },
77
  {
78
  "epoch": 0.11,
79
  "learning_rate": 1.0771992818671456e-06,
80
+ "loss": 1.3764,
81
  "step": 120
82
  },
83
  {
84
  "epoch": 0.12,
85
  "learning_rate": 1.1669658886894075e-06,
86
+ "loss": 1.3688,
87
  "step": 130
88
  },
89
  {
90
  "epoch": 0.13,
91
  "learning_rate": 1.2567324955116697e-06,
92
+ "loss": 1.3708,
93
  "step": 140
94
  },
95
  {
96
  "epoch": 0.13,
97
  "learning_rate": 1.3464991023339318e-06,
98
+ "loss": 1.366,
99
  "step": 150
100
  },
101
  {
102
  "epoch": 0.14,
103
  "learning_rate": 1.436265709156194e-06,
104
+ "loss": 1.371,
105
  "step": 160
106
  },
107
  {
108
  "epoch": 0.15,
109
  "learning_rate": 1.5260323159784561e-06,
110
+ "loss": 1.3558,
111
  "step": 170
112
  },
113
  {
114
  "epoch": 0.16,
115
  "learning_rate": 1.6157989228007182e-06,
116
+ "loss": 1.3584,
117
  "step": 180
118
  },
119
  {
120
  "epoch": 0.17,
121
  "learning_rate": 1.7055655296229805e-06,
122
+ "loss": 1.3409,
123
  "step": 190
124
  },
125
  {
126
  "epoch": 0.18,
127
  "learning_rate": 1.7953321364452425e-06,
128
+ "loss": 1.346,
129
  "step": 200
130
  },
131
  {
132
  "epoch": 0.19,
133
  "learning_rate": 1.8850987432675046e-06,
134
+ "loss": 1.3355,
135
  "step": 210
136
  },
137
  {
138
  "epoch": 0.2,
139
  "learning_rate": 1.9748653500897667e-06,
140
+ "loss": 1.3323,
141
  "step": 220
142
  },
143
  {
144
  "epoch": 0.21,
145
  "learning_rate": 2.064631956912029e-06,
146
+ "loss": 1.3231,
147
  "step": 230
148
  },
149
  {
150
  "epoch": 0.22,
151
  "learning_rate": 2.1543985637342912e-06,
152
+ "loss": 1.3129,
153
  "step": 240
154
  },
155
  {
156
  "epoch": 0.22,
157
  "learning_rate": 2.244165170556553e-06,
158
+ "loss": 1.3178,
159
  "step": 250
160
  },
161
  {
162
  "epoch": 0.23,
163
  "learning_rate": 2.333931777378815e-06,
164
+ "loss": 1.2953,
165
  "step": 260
166
  },
167
  {
168
  "epoch": 0.24,
169
  "learning_rate": 2.423698384201077e-06,
170
+ "loss": 1.2938,
171
  "step": 270
172
  },
173
  {
174
  "epoch": 0.25,
175
  "learning_rate": 2.5134649910233395e-06,
176
+ "loss": 1.2849,
177
  "step": 280
178
  },
179
  {
180
  "epoch": 0.26,
181
  "learning_rate": 2.6032315978456015e-06,
182
+ "loss": 1.2813,
183
  "step": 290
184
  },
185
  {
186
  "epoch": 0.27,
187
  "learning_rate": 2.6929982046678636e-06,
188
+ "loss": 1.2811,
189
  "step": 300
190
  },
191
  {
192
  "epoch": 0.28,
193
  "learning_rate": 2.7827648114901257e-06,
194
+ "loss": 1.2526,
195
  "step": 310
196
  },
197
  {
198
  "epoch": 0.29,
199
  "learning_rate": 2.872531418312388e-06,
200
+ "loss": 1.2438,
201
  "step": 320
202
  },
203
  {
204
  "epoch": 0.3,
205
  "learning_rate": 2.9622980251346502e-06,
206
+ "loss": 1.2145,
207
  "step": 330
208
  },
209
  {
210
  "epoch": 0.31,
211
  "learning_rate": 3.0520646319569123e-06,
212
+ "loss": 1.2146,
213
  "step": 340
214
  },
215
  {
216
  "epoch": 0.31,
217
  "learning_rate": 3.1418312387791743e-06,
218
+ "loss": 1.1883,
219
  "step": 350
220
  },
221
  {
222
  "epoch": 0.32,
223
  "learning_rate": 3.2315978456014364e-06,
224
+ "loss": 1.1891,
225
  "step": 360
226
  },
227
  {
228
  "epoch": 0.33,
229
  "learning_rate": 3.321364452423698e-06,
230
+ "loss": 1.1723,
231
  "step": 370
232
  },
233
  {
234
  "epoch": 0.34,
235
  "learning_rate": 3.411131059245961e-06,
236
+ "loss": 1.1417,
237
  "step": 380
238
  },
239
  {
240
  "epoch": 0.35,
241
  "learning_rate": 3.500897666068223e-06,
242
+ "loss": 1.1338,
243
  "step": 390
244
  },
245
  {
246
  "epoch": 0.36,
247
  "learning_rate": 3.590664272890485e-06,
248
+ "loss": 1.1004,
249
  "step": 400
250
  },
251
  {
252
  "epoch": 0.37,
253
  "learning_rate": 3.680430879712747e-06,
254
+ "loss": 1.0873,
255
  "step": 410
256
  },
257
  {
258
  "epoch": 0.38,
259
  "learning_rate": 3.770197486535009e-06,
260
+ "loss": 1.0358,
261
  "step": 420
262
  },
263
  {
264
  "epoch": 0.39,
265
  "learning_rate": 3.859964093357271e-06,
266
+ "loss": 1.0517,
267
  "step": 430
268
  },
269
  {
270
  "epoch": 0.39,
271
  "learning_rate": 3.949730700179533e-06,
272
+ "loss": 1.0139,
273
  "step": 440
274
  },
275
  {
276
  "epoch": 0.4,
277
  "learning_rate": 4.039497307001795e-06,
278
+ "loss": 1.0294,
279
  "step": 450
280
  },
281
  {
282
  "epoch": 0.41,
283
  "learning_rate": 4.129263913824058e-06,
284
+ "loss": 1.0171,
285
  "step": 460
286
  },
287
  {
288
  "epoch": 0.42,
289
  "learning_rate": 4.21903052064632e-06,
290
+ "loss": 0.9827,
291
  "step": 470
292
  },
293
  {
294
  "epoch": 0.43,
295
  "learning_rate": 4.3087971274685824e-06,
296
+ "loss": 0.9382,
297
  "step": 480
298
  },
299
  {
300
  "epoch": 0.44,
301
  "learning_rate": 4.3985637342908445e-06,
302
+ "loss": 0.9145,
303
  "step": 490
304
  },
305
  {
306
  "epoch": 0.45,
307
  "learning_rate": 4.488330341113106e-06,
308
+ "loss": 0.9276,
309
  "step": 500
310
  },
311
  {
312
  "epoch": 0.46,
313
  "learning_rate": 4.578096947935368e-06,
314
+ "loss": 0.8801,
315
  "step": 510
316
  },
317
  {
318
  "epoch": 0.47,
319
  "learning_rate": 4.66786355475763e-06,
320
+ "loss": 0.8906,
321
  "step": 520
322
  },
323
  {
324
  "epoch": 0.48,
325
  "learning_rate": 4.757630161579892e-06,
326
+ "loss": 0.9025,
327
  "step": 530
328
  },
329
  {
330
  "epoch": 0.48,
331
  "learning_rate": 4.847396768402154e-06,
332
+ "loss": 0.8621,
333
  "step": 540
334
  },
335
  {
336
  "epoch": 0.49,
337
  "learning_rate": 4.937163375224417e-06,
338
+ "loss": 0.8653,
339
  "step": 550
340
  },
341
  {
342
  "epoch": 0.5,
343
  "learning_rate": 5.026929982046679e-06,
344
+ "loss": 0.8292,
345
  "step": 560
346
  },
347
  {
348
  "epoch": 0.51,
349
  "learning_rate": 5.116696588868941e-06,
350
+ "loss": 0.8195,
351
  "step": 570
352
  },
353
  {
354
  "epoch": 0.52,
355
  "learning_rate": 5.206463195691203e-06,
356
+ "loss": 0.8026,
357
  "step": 580
358
  },
359
  {
360
  "epoch": 0.53,
361
  "learning_rate": 5.296229802513465e-06,
362
+ "loss": 0.841,
363
  "step": 590
364
  },
365
  {
366
  "epoch": 0.54,
367
  "learning_rate": 5.385996409335727e-06,
368
+ "loss": 0.778,
369
  "step": 600
370
  },
371
  {
372
  "epoch": 0.55,
373
  "learning_rate": 5.475763016157989e-06,
374
+ "loss": 0.7706,
375
  "step": 610
376
  },
377
  {
378
  "epoch": 0.56,
379
  "learning_rate": 5.565529622980251e-06,
380
+ "loss": 0.733,
381
  "step": 620
382
  },
383
  {
384
  "epoch": 0.57,
385
  "learning_rate": 5.655296229802514e-06,
386
+ "loss": 0.7437,
387
  "step": 630
388
  },
389
  {
390
  "epoch": 0.57,
391
  "learning_rate": 5.745062836624776e-06,
392
+ "loss": 0.7644,
393
  "step": 640
394
  },
395
  {
396
  "epoch": 0.58,
397
  "learning_rate": 5.834829443447038e-06,
398
+ "loss": 0.7125,
399
  "step": 650
400
  },
401
  {
402
  "epoch": 0.59,
403
  "learning_rate": 5.9245960502693004e-06,
404
+ "loss": 0.7146,
405
  "step": 660
406
  },
407
  {
408
  "epoch": 0.6,
409
  "learning_rate": 6.0143626570915625e-06,
410
+ "loss": 0.7201,
411
  "step": 670
412
  },
413
  {
414
  "epoch": 0.61,
415
  "learning_rate": 6.1041292639138246e-06,
416
+ "loss": 0.6851,
417
  "step": 680
418
  },
419
  {
420
  "epoch": 0.62,
421
  "learning_rate": 6.193895870736087e-06,
422
+ "loss": 0.6417,
423
  "step": 690
424
  },
425
  {
426
  "epoch": 0.63,
427
  "learning_rate": 6.283662477558349e-06,
428
+ "loss": 0.6656,
429
  "step": 700
430
  },
431
  {
432
  "epoch": 0.64,
433
  "learning_rate": 6.373429084380611e-06,
434
+ "loss": 0.6122,
435
  "step": 710
436
  },
437
  {
438
  "epoch": 0.65,
439
  "learning_rate": 6.463195691202873e-06,
440
+ "loss": 0.6536,
441
  "step": 720
442
  },
443
  {
444
  "epoch": 0.65,
445
  "learning_rate": 6.552962298025135e-06,
446
+ "loss": 0.6315,
447
  "step": 730
448
  },
449
  {
450
  "epoch": 0.66,
451
  "learning_rate": 6.642728904847396e-06,
452
+ "loss": 0.6618,
453
  "step": 740
454
  },
455
  {
456
  "epoch": 0.67,
457
  "learning_rate": 6.732495511669659e-06,
458
+ "loss": 0.6346,
459
  "step": 750
460
  },
461
  {
462
  "epoch": 0.68,
463
  "learning_rate": 6.822262118491922e-06,
464
+ "loss": 0.6866,
465
  "step": 760
466
  },
467
  {
468
  "epoch": 0.69,
469
  "learning_rate": 6.912028725314183e-06,
470
+ "loss": 0.6093,
471
  "step": 770
472
  },
473
  {
474
  "epoch": 0.7,
475
  "learning_rate": 7.001795332136446e-06,
476
+ "loss": 0.6116,
477
  "step": 780
478
  },
479
  {
480
  "epoch": 0.71,
481
  "learning_rate": 7.091561938958707e-06,
482
+ "loss": 0.602,
483
  "step": 790
484
  },
485
  {
486
  "epoch": 0.72,
487
  "learning_rate": 7.18132854578097e-06,
488
+ "loss": 0.6266,
489
  "step": 800
490
  },
491
  {
492
  "epoch": 0.73,
493
  "learning_rate": 7.271095152603231e-06,
494
+ "loss": 0.6082,
495
  "step": 810
496
  },
497
  {
498
  "epoch": 0.74,
499
  "learning_rate": 7.360861759425494e-06,
500
+ "loss": 0.6194,
501
  "step": 820
502
  },
503
  {
504
  "epoch": 0.74,
505
  "learning_rate": 7.4506283662477555e-06,
506
+ "loss": 0.6277,
507
  "step": 830
508
  },
509
  {
510
  "epoch": 0.75,
511
  "learning_rate": 7.540394973070018e-06,
512
+ "loss": 0.609,
513
  "step": 840
514
  },
515
  {
516
  "epoch": 0.76,
517
  "learning_rate": 7.630161579892281e-06,
518
+ "loss": 0.6252,
519
  "step": 850
520
  },
521
  {
522
  "epoch": 0.77,
523
  "learning_rate": 7.719928186714543e-06,
524
+ "loss": 0.5813,
525
  "step": 860
526
  },
527
  {
528
  "epoch": 0.78,
529
  "learning_rate": 7.809694793536805e-06,
530
+ "loss": 0.5799,
531
  "step": 870
532
  },
533
  {
534
  "epoch": 0.79,
535
  "learning_rate": 7.899461400359067e-06,
536
+ "loss": 0.6398,
537
  "step": 880
538
  },
539
  {
540
  "epoch": 0.8,
541
  "learning_rate": 7.98922800718133e-06,
542
+ "loss": 0.5549,
543
  "step": 890
544
  },
545
  {
546
  "epoch": 0.81,
547
  "learning_rate": 8.07899461400359e-06,
548
+ "loss": 0.6023,
549
  "step": 900
550
  },
551
  {
552
  "epoch": 0.82,
553
  "learning_rate": 8.168761220825854e-06,
554
+ "loss": 0.582,
555
  "step": 910
556
  },
557
  {
558
  "epoch": 0.83,
559
  "learning_rate": 8.258527827648117e-06,
560
+ "loss": 0.544,
561
  "step": 920
562
  },
563
  {
564
  "epoch": 0.83,
565
  "learning_rate": 8.348294434470378e-06,
566
+ "loss": 0.5912,
567
  "step": 930
568
  },
569
  {
570
  "epoch": 0.84,
571
  "learning_rate": 8.43806104129264e-06,
572
+ "loss": 0.5461,
573
  "step": 940
574
  },
575
  {
576
  "epoch": 0.85,
577
  "learning_rate": 8.527827648114902e-06,
578
+ "loss": 0.5238,
579
  "step": 950
580
  },
581
  {
582
  "epoch": 0.86,
583
  "learning_rate": 8.617594254937165e-06,
584
+ "loss": 0.5558,
585
  "step": 960
586
  },
587
  {
588
  "epoch": 0.87,
589
  "learning_rate": 8.707360861759426e-06,
590
+ "loss": 0.5371,
591
  "step": 970
592
  },
593
  {
594
  "epoch": 0.88,
595
  "learning_rate": 8.797127468581689e-06,
596
+ "loss": 0.5529,
597
  "step": 980
598
  },
599
  {
600
  "epoch": 0.89,
601
  "learning_rate": 8.88689407540395e-06,
602
+ "loss": 0.5691,
603
  "step": 990
604
  },
605
  {
606
  "epoch": 0.9,
607
  "learning_rate": 8.976660682226211e-06,
608
+ "loss": 0.5567,
609
  "step": 1000
610
  },
611
  {
612
  "epoch": 0.91,
613
  "learning_rate": 9.066427289048474e-06,
614
+ "loss": 0.5135,
615
  "step": 1010
616
  },
617
  {
618
  "epoch": 0.92,
619
  "learning_rate": 9.156193895870736e-06,
620
+ "loss": 0.5099,
621
  "step": 1020
622
  },
623
  {
624
  "epoch": 0.92,
625
  "learning_rate": 9.245960502692998e-06,
626
+ "loss": 0.5422,
627
  "step": 1030
628
  },
629
  {
630
  "epoch": 0.93,
631
  "learning_rate": 9.33572710951526e-06,
632
+ "loss": 0.5106,
633
  "step": 1040
634
  },
635
  {
636
  "epoch": 0.94,
637
  "learning_rate": 9.425493716337523e-06,
638
+ "loss": 0.4892,
639
  "step": 1050
640
  },
641
  {
642
  "epoch": 0.95,
643
  "learning_rate": 9.515260323159784e-06,
644
+ "loss": 0.4541,
645
  "step": 1060
646
  },
647
  {
648
  "epoch": 0.96,
649
  "learning_rate": 9.605026929982047e-06,
650
+ "loss": 0.4675,
651
  "step": 1070
652
  },
653
  {
654
  "epoch": 0.97,
655
  "learning_rate": 9.694793536804308e-06,
656
+ "loss": 0.5123,
657
  "step": 1080
658
  },
659
  {
660
  "epoch": 0.98,
661
  "learning_rate": 9.784560143626571e-06,
662
+ "loss": 0.5089,
663
  "step": 1090
664
  },
665
  {
666
  "epoch": 0.99,
667
  "learning_rate": 9.874326750448834e-06,
668
+ "loss": 0.5233,
669
  "step": 1100
670
  },
671
  {
672
  "epoch": 1.0,
673
  "learning_rate": 9.964093357271095e-06,
674
+ "loss": 0.5622,
675
  "step": 1110
676
  },
677
  {
678
  "epoch": 1.0,
679
  "eval_accuracy": {
680
+ "accuracy": 0.8736263736263736
681
  },
682
  "eval_f1": {
683
+ "f1": 0.8653360894930927
684
  },
685
+ "eval_loss": 0.4108576774597168,
686
  "eval_precision": {
687
+ "precision": 0.8669392826942903
688
  },
689
  "eval_recall": {
690
+ "recall": 0.8641606609285752
691
  },
692
+ "eval_runtime": 236.9507,
693
+ "eval_samples_per_second": 75.273,
694
+ "eval_steps_per_second": 4.706,
695
  "step": 1114
696
  },
697
  {
698
  "epoch": 1.0,
699
  "learning_rate": 1.0053859964093358e-05,
700
+ "loss": 0.4957,
701
  "step": 1120
702
  },
703
  {
704
  "epoch": 1.01,
705
  "learning_rate": 1.0143626570915619e-05,
706
+ "loss": 0.5729,
707
  "step": 1130
708
  },
709
  {
710
  "epoch": 1.02,
711
  "learning_rate": 1.0233393177737882e-05,
712
+ "loss": 0.4884,
713
  "step": 1140
714
  },
715
  {
716
  "epoch": 1.03,
717
  "learning_rate": 1.0323159784560143e-05,
718
+ "loss": 0.4744,
719
  "step": 1150
720
  },
721
  {
722
  "epoch": 1.04,
723
  "learning_rate": 1.0412926391382406e-05,
724
+ "loss": 0.4683,
725
  "step": 1160
726
  },
727
  {
728
  "epoch": 1.05,
729
  "learning_rate": 1.0502692998204669e-05,
730
+ "loss": 0.5,
731
  "step": 1170
732
  },
733
  {
734
  "epoch": 1.06,
735
  "learning_rate": 1.059245960502693e-05,
736
+ "loss": 0.4649,
737
  "step": 1180
738
  },
739
  {
740
  "epoch": 1.07,
741
  "learning_rate": 1.0682226211849193e-05,
742
+ "loss": 0.508,
743
  "step": 1190
744
  },
745
  {
746
  "epoch": 1.08,
747
  "learning_rate": 1.0771992818671454e-05,
748
+ "loss": 0.4898,
749
  "step": 1200
750
  },
751
  {
752
  "epoch": 1.09,
753
  "learning_rate": 1.0861759425493717e-05,
754
+ "loss": 0.4722,
755
  "step": 1210
756
  },
757
  {
758
  "epoch": 1.09,
759
  "learning_rate": 1.0951526032315979e-05,
760
+ "loss": 0.4814,
761
  "step": 1220
762
  },
763
  {
764
  "epoch": 1.1,
765
  "learning_rate": 1.1041292639138241e-05,
766
+ "loss": 0.4505,
767
  "step": 1230
768
  },
769
  {
770
  "epoch": 1.11,
771
  "learning_rate": 1.1131059245960503e-05,
772
+ "loss": 0.4505,
773
  "step": 1240
774
  },
775
  {
776
  "epoch": 1.12,
777
  "learning_rate": 1.1220825852782766e-05,
778
+ "loss": 0.4187,
779
  "step": 1250
780
  },
781
  {
782
  "epoch": 1.13,
783
  "learning_rate": 1.1310592459605028e-05,
784
+ "loss": 0.4603,
785
  "step": 1260
786
  },
787
  {
788
  "epoch": 1.14,
789
  "learning_rate": 1.140035906642729e-05,
790
+ "loss": 0.4721,
791
  "step": 1270
792
  },
793
  {
794
  "epoch": 1.15,
795
  "learning_rate": 1.1490125673249553e-05,
796
+ "loss": 0.4368,
797
  "step": 1280
798
  },
799
  {
800
  "epoch": 1.16,
801
  "learning_rate": 1.1579892280071814e-05,
802
+ "loss": 0.4722,
803
  "step": 1290
804
  },
805
  {
806
  "epoch": 1.17,
807
  "learning_rate": 1.1669658886894077e-05,
808
+ "loss": 0.4718,
809
  "step": 1300
810
  },
811
  {
812
  "epoch": 1.18,
813
  "learning_rate": 1.1759425493716338e-05,
814
+ "loss": 0.4899,
815
  "step": 1310
816
  },
817
  {
818
  "epoch": 1.18,
819
  "learning_rate": 1.1849192100538601e-05,
820
+ "loss": 0.4758,
821
  "step": 1320
822
  },
823
  {
824
  "epoch": 1.19,
825
  "learning_rate": 1.1938958707360862e-05,
826
+ "loss": 0.4523,
827
  "step": 1330
828
  },
829
  {
830
  "epoch": 1.2,
831
  "learning_rate": 1.2028725314183125e-05,
832
+ "loss": 0.485,
833
  "step": 1340
834
  },
835
  {
836
  "epoch": 1.21,
837
  "learning_rate": 1.2118491921005388e-05,
838
+ "loss": 0.4977,
839
  "step": 1350
840
  },
841
  {
842
  "epoch": 1.22,
843
  "learning_rate": 1.2208258527827649e-05,
844
+ "loss": 0.4305,
845
  "step": 1360
846
  },
847
  {
848
  "epoch": 1.23,
849
  "learning_rate": 1.2298025134649912e-05,
850
+ "loss": 0.4221,
851
  "step": 1370
852
  },
853
  {
854
  "epoch": 1.24,
855
  "learning_rate": 1.2387791741472173e-05,
856
+ "loss": 0.4975,
857
  "step": 1380
858
  },
859
  {
860
  "epoch": 1.25,
861
  "learning_rate": 1.2477558348294434e-05,
862
+ "loss": 0.4506,
863
  "step": 1390
864
  },
865
  {
866
  "epoch": 1.26,
867
  "learning_rate": 1.2567324955116697e-05,
868
+ "loss": 0.4326,
869
  "step": 1400
870
  },
871
  {
872
  "epoch": 1.26,
873
  "learning_rate": 1.2657091561938959e-05,
874
+ "loss": 0.4479,
875
  "step": 1410
876
  },
877
  {
878
  "epoch": 1.27,
879
  "learning_rate": 1.2746858168761221e-05,
880
+ "loss": 0.4468,
881
  "step": 1420
882
  },
883
  {
884
  "epoch": 1.28,
885
  "learning_rate": 1.2836624775583483e-05,
886
+ "loss": 0.402,
887
  "step": 1430
888
  },
889
  {
890
  "epoch": 1.29,
891
  "learning_rate": 1.2926391382405746e-05,
892
+ "loss": 0.4711,
893
  "step": 1440
894
  },
895
  {
896
  "epoch": 1.3,
897
  "learning_rate": 1.3016157989228009e-05,
898
+ "loss": 0.4686,
899
  "step": 1450
900
  },
901
  {
902
  "epoch": 1.31,
903
  "learning_rate": 1.310592459605027e-05,
904
+ "loss": 0.4639,
905
  "step": 1460
906
  },
907
  {
908
  "epoch": 1.32,
909
  "learning_rate": 1.3195691202872531e-05,
910
+ "loss": 0.435,
911
  "step": 1470
912
  },
913
  {
914
  "epoch": 1.33,
915
  "learning_rate": 1.3285457809694792e-05,
916
+ "loss": 0.3868,
917
  "step": 1480
918
  },
919
  {
920
  "epoch": 1.34,
921
  "learning_rate": 1.3375224416517057e-05,
922
+ "loss": 0.4303,
923
  "step": 1490
924
  },
925
  {
926
  "epoch": 1.35,
927
  "learning_rate": 1.3464991023339318e-05,
928
+ "loss": 0.432,
929
  "step": 1500
930
  },
931
  {
932
  "epoch": 1.35,
933
  "learning_rate": 1.355475763016158e-05,
934
+ "loss": 0.4206,
935
  "step": 1510
936
  },
937
  {
938
  "epoch": 1.36,
939
  "learning_rate": 1.3644524236983844e-05,
940
+ "loss": 0.4282,
941
  "step": 1520
942
  },
943
  {
944
  "epoch": 1.37,
945
  "learning_rate": 1.3734290843806105e-05,
946
+ "loss": 0.4284,
947
  "step": 1530
948
  },
949
  {
950
  "epoch": 1.38,
951
  "learning_rate": 1.3824057450628366e-05,
952
+ "loss": 0.4096,
953
  "step": 1540
954
  },
955
  {
956
  "epoch": 1.39,
957
  "learning_rate": 1.3913824057450627e-05,
958
+ "loss": 0.4259,
959
  "step": 1550
960
  },
961
  {
962
  "epoch": 1.4,
963
  "learning_rate": 1.4003590664272892e-05,
964
+ "loss": 0.4436,
965
  "step": 1560
966
  },
967
  {
968
  "epoch": 1.41,
969
  "learning_rate": 1.4093357271095153e-05,
970
+ "loss": 0.4453,
971
  "step": 1570
972
  },
973
  {
974
  "epoch": 1.42,
975
  "learning_rate": 1.4183123877917415e-05,
976
+ "loss": 0.4065,
977
  "step": 1580
978
  },
979
  {
980
  "epoch": 1.43,
981
  "learning_rate": 1.4272890484739679e-05,
982
+ "loss": 0.4011,
983
  "step": 1590
984
  },
985
  {
986
  "epoch": 1.44,
987
  "learning_rate": 1.436265709156194e-05,
988
+ "loss": 0.4488,
989
  "step": 1600
990
  },
991
  {
992
  "epoch": 1.44,
993
  "learning_rate": 1.4452423698384202e-05,
994
+ "loss": 0.4122,
995
  "step": 1610
996
  },
997
  {
998
  "epoch": 1.45,
999
  "learning_rate": 1.4542190305206463e-05,
1000
+ "loss": 0.429,
1001
  "step": 1620
1002
  },
1003
  {
1004
  "epoch": 1.46,
1005
  "learning_rate": 1.4631956912028727e-05,
1006
+ "loss": 0.4377,
1007
  "step": 1630
1008
  },
1009
  {
1010
  "epoch": 1.47,
1011
  "learning_rate": 1.4721723518850989e-05,
1012
+ "loss": 0.4186,
1013
  "step": 1640
1014
  },
1015
  {
1016
  "epoch": 1.48,
1017
  "learning_rate": 1.481149012567325e-05,
1018
+ "loss": 0.4063,
1019
  "step": 1650
1020
  },
1021
  {
1022
  "epoch": 1.49,
1023
  "learning_rate": 1.4901256732495511e-05,
1024
+ "loss": 0.4055,
1025
  "step": 1660
1026
  },
1027
  {
1028
  "epoch": 1.5,
1029
  "learning_rate": 1.4991023339317776e-05,
1030
+ "loss": 0.4173,
1031
  "step": 1670
1032
  },
1033
  {
1034
  "epoch": 1.51,
1035
  "learning_rate": 1.5080789946140037e-05,
1036
+ "loss": 0.4361,
1037
  "step": 1680
1038
  },
1039
  {
1040
  "epoch": 1.52,
1041
  "learning_rate": 1.5170556552962298e-05,
1042
+ "loss": 0.4528,
1043
  "step": 1690
1044
  },
1045
  {
1046
  "epoch": 1.53,
1047
  "learning_rate": 1.5260323159784563e-05,
1048
+ "loss": 0.3665,
1049
  "step": 1700
1050
  },
1051
  {
1052
  "epoch": 1.53,
1053
  "learning_rate": 1.5350089766606824e-05,
1054
+ "loss": 0.3913,
1055
  "step": 1710
1056
  },
1057
  {
1058
  "epoch": 1.54,
1059
  "learning_rate": 1.5439856373429085e-05,
1060
+ "loss": 0.4002,
1061
  "step": 1720
1062
  },
1063
  {
1064
  "epoch": 1.55,
1065
  "learning_rate": 1.5529622980251346e-05,
1066
+ "loss": 0.4004,
1067
  "step": 1730
1068
  },
1069
  {
1070
  "epoch": 1.56,
1071
  "learning_rate": 1.561938958707361e-05,
1072
+ "loss": 0.4432,
1073
  "step": 1740
1074
  },
1075
  {
1076
  "epoch": 1.57,
1077
  "learning_rate": 1.5709156193895872e-05,
1078
+ "loss": 0.3743,
1079
  "step": 1750
1080
  },
1081
  {
1082
  "epoch": 1.58,
1083
  "learning_rate": 1.5798922800718133e-05,
1084
+ "loss": 0.3972,
1085
  "step": 1760
1086
  },
1087
  {
1088
  "epoch": 1.59,
1089
  "learning_rate": 1.5888689407540398e-05,
1090
+ "loss": 0.368,
1091
  "step": 1770
1092
  },
1093
  {
1094
  "epoch": 1.6,
1095
  "learning_rate": 1.597845601436266e-05,
1096
+ "loss": 0.4525,
1097
  "step": 1780
1098
  },
1099
  {
1100
  "epoch": 1.61,
1101
  "learning_rate": 1.606822262118492e-05,
1102
+ "loss": 0.3962,
1103
  "step": 1790
1104
  },
1105
  {
1106
  "epoch": 1.61,
1107
  "learning_rate": 1.615798922800718e-05,
1108
+ "loss": 0.3888,
1109
  "step": 1800
1110
  },
1111
  {
1112
  "epoch": 1.62,
1113
  "learning_rate": 1.6247755834829446e-05,
1114
+ "loss": 0.4111,
1115
  "step": 1810
1116
  },
1117
  {
1118
  "epoch": 1.63,
1119
  "learning_rate": 1.6337522441651707e-05,
1120
+ "loss": 0.4084,
1121
  "step": 1820
1122
  },
1123
  {
1124
  "epoch": 1.64,
1125
  "learning_rate": 1.642728904847397e-05,
1126
+ "loss": 0.4181,
1127
  "step": 1830
1128
  },
1129
  {
1130
  "epoch": 1.65,
1131
  "learning_rate": 1.6517055655296233e-05,
1132
+ "loss": 0.4022,
1133
  "step": 1840
1134
  },
1135
  {
1136
  "epoch": 1.66,
1137
  "learning_rate": 1.6606822262118494e-05,
1138
+ "loss": 0.3886,
1139
  "step": 1850
1140
  },
1141
  {
1142
  "epoch": 1.67,
1143
  "learning_rate": 1.6696588868940756e-05,
1144
+ "loss": 0.4092,
1145
  "step": 1860
1146
  },
1147
  {
1148
  "epoch": 1.68,
1149
  "learning_rate": 1.6786355475763017e-05,
1150
+ "loss": 0.3843,
1151
  "step": 1870
1152
  },
1153
  {
1154
  "epoch": 1.69,
1155
  "learning_rate": 1.687612208258528e-05,
1156
+ "loss": 0.4237,
1157
  "step": 1880
1158
  },
1159
  {
1160
  "epoch": 1.7,
1161
  "learning_rate": 1.6965888689407543e-05,
1162
+ "loss": 0.3801,
1163
  "step": 1890
1164
  },
1165
  {
1166
  "epoch": 1.7,
1167
  "learning_rate": 1.7055655296229804e-05,
1168
+ "loss": 0.385,
1169
  "step": 1900
1170
  },
1171
  {
1172
  "epoch": 1.71,
1173
  "learning_rate": 1.7145421903052065e-05,
1174
+ "loss": 0.4452,
1175
  "step": 1910
1176
  },
1177
  {
1178
  "epoch": 1.72,
1179
  "learning_rate": 1.723518850987433e-05,
1180
+ "loss": 0.5147,
1181
  "step": 1920
1182
  },
1183
  {
1184
  "epoch": 1.73,
1185
  "learning_rate": 1.732495511669659e-05,
1186
+ "loss": 0.353,
1187
  "step": 1930
1188
  },
1189
  {
1190
  "epoch": 1.74,
1191
  "learning_rate": 1.7414721723518852e-05,
1192
+ "loss": 0.3816,
1193
  "step": 1940
1194
  },
1195
  {
1196
  "epoch": 1.75,
1197
  "learning_rate": 1.7504488330341113e-05,
1198
+ "loss": 0.361,
1199
  "step": 1950
1200
  },
1201
  {
1202
  "epoch": 1.76,
1203
  "learning_rate": 1.7594254937163378e-05,
1204
+ "loss": 0.3884,
1205
  "step": 1960
1206
  },
1207
  {
1208
  "epoch": 1.77,
1209
  "learning_rate": 1.768402154398564e-05,
1210
+ "loss": 0.3391,
1211
  "step": 1970
1212
  },
1213
  {
1214
  "epoch": 1.78,
1215
  "learning_rate": 1.77737881508079e-05,
1216
+ "loss": 0.4211,
1217
  "step": 1980
1218
  },
1219
  {
1220
  "epoch": 1.79,
1221
  "learning_rate": 1.786355475763016e-05,
1222
+ "loss": 0.3796,
1223
  "step": 1990
1224
  },
1225
  {
1226
  "epoch": 1.79,
1227
  "learning_rate": 1.7953321364452423e-05,
1228
+ "loss": 0.3881,
1229
  "step": 2000
1230
  },
1231
  {
1232
  "epoch": 1.8,
1233
  "learning_rate": 1.8043087971274687e-05,
1234
+ "loss": 0.3904,
1235
  "step": 2010
1236
  },
1237
  {
1238
  "epoch": 1.81,
1239
  "learning_rate": 1.813285457809695e-05,
1240
+ "loss": 0.3845,
1241
  "step": 2020
1242
  },
1243
  {
1244
  "epoch": 1.82,
1245
  "learning_rate": 1.822262118491921e-05,
1246
+ "loss": 0.3721,
1247
  "step": 2030
1248
  },
1249
  {
1250
  "epoch": 1.83,
1251
  "learning_rate": 1.831238779174147e-05,
1252
+ "loss": 0.4141,
1253
  "step": 2040
1254
  },
1255
  {
1256
  "epoch": 1.84,
1257
  "learning_rate": 1.8402154398563732e-05,
1258
+ "loss": 0.3682,
1259
  "step": 2050
1260
  },
1261
  {
1262
  "epoch": 1.85,
1263
  "learning_rate": 1.8491921005385997e-05,
1264
+ "loss": 0.3826,
1265
  "step": 2060
1266
  },
1267
  {
1268
  "epoch": 1.86,
1269
  "learning_rate": 1.8581687612208258e-05,
1270
+ "loss": 0.3588,
1271
  "step": 2070
1272
  },
1273
  {
1274
  "epoch": 1.87,
1275
  "learning_rate": 1.867145421903052e-05,
1276
+ "loss": 0.3663,
1277
  "step": 2080
1278
  },
1279
  {
1280
  "epoch": 1.87,
1281
  "learning_rate": 1.8761220825852784e-05,
1282
+ "loss": 0.4186,
1283
  "step": 2090
1284
  },
1285
  {
1286
  "epoch": 1.88,
1287
  "learning_rate": 1.8850987432675045e-05,
1288
+ "loss": 0.3756,
1289
  "step": 2100
1290
  },
1291
  {
1292
  "epoch": 1.89,
1293
  "learning_rate": 1.8940754039497306e-05,
1294
+ "loss": 0.3655,
1295
  "step": 2110
1296
  },
1297
  {
1298
  "epoch": 1.9,
1299
  "learning_rate": 1.9030520646319568e-05,
1300
+ "loss": 0.4158,
1301
  "step": 2120
1302
  },
1303
  {
1304
  "epoch": 1.91,
1305
  "learning_rate": 1.9120287253141832e-05,
1306
+ "loss": 0.3985,
1307
  "step": 2130
1308
  },
1309
  {
1310
  "epoch": 1.92,
1311
  "learning_rate": 1.9210053859964093e-05,
1312
+ "loss": 0.3955,
1313
  "step": 2140
1314
  },
1315
  {
1316
  "epoch": 1.93,
1317
  "learning_rate": 1.9299820466786355e-05,
1318
+ "loss": 0.3757,
1319
  "step": 2150
1320
  },
1321
  {
1322
  "epoch": 1.94,
1323
  "learning_rate": 1.9389587073608616e-05,
1324
+ "loss": 0.3712,
1325
  "step": 2160
1326
  },
1327
  {
1328
  "epoch": 1.95,
1329
  "learning_rate": 1.947935368043088e-05,
1330
+ "loss": 0.3723,
1331
  "step": 2170
1332
  },
1333
  {
1334
  "epoch": 1.96,
1335
  "learning_rate": 1.9569120287253142e-05,
1336
+ "loss": 0.367,
1337
  "step": 2180
1338
  },
1339
  {
1340
  "epoch": 1.96,
1341
  "learning_rate": 1.9658886894075403e-05,
1342
+ "loss": 0.3659,
1343
  "step": 2190
1344
  },
1345
  {
1346
  "epoch": 1.97,
1347
  "learning_rate": 1.9748653500897668e-05,
1348
+ "loss": 0.3752,
1349
  "step": 2200
1350
  },
1351
  {
1352
  "epoch": 1.98,
1353
  "learning_rate": 1.983842010771993e-05,
1354
+ "loss": 0.318,
1355
  "step": 2210
1356
  },
1357
  {
1358
  "epoch": 1.99,
1359
  "learning_rate": 1.992818671454219e-05,
1360
+ "loss": 0.3696,
1361
  "step": 2220
1362
  },
1363
  {
1364
  "epoch": 2.0,
1365
  "eval_accuracy": {
1366
+ "accuracy": 0.9249271137026239
1367
  },
1368
  "eval_f1": {
1369
+ "f1": 0.9207602119769538
1370
  },
1371
+ "eval_loss": 0.2492757886648178,
1372
  "eval_precision": {
1373
+ "precision": 0.9199949527238288
1374
  },
1375
  "eval_recall": {
1376
+ "recall": 0.9219224853720074
1377
  },
1378
+ "eval_runtime": 166.1808,
1379
+ "eval_samples_per_second": 107.329,
1380
+ "eval_steps_per_second": 6.71,
1381
  "step": 2229
1382
  }
1383
  ],
tmp-checkpoint-2229/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3394b871720811033add862f1e1383ca3790e6ab55972b19ed900a5d6b59c978
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c55fb57ba4dc2c9b2c813516c4846a21f1047b19b6cf48a97b9224ced523b9b
3
  size 4792