mmomm25 commited on
Commit
07cff62
1 Parent(s): fece4d1

Training in progress, epoch 0

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5601532bb74198b0a27893b6eb80cb42adfdb3f3e4928eb8e76270450fa388c
3
  size 343230128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5351ced59e7c85a3fb2f7c177c877ac1785f0eb288bcfa15c371ef575b43f0b
3
  size 343230128
tmp-checkpoint-1114/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b47f93d99bd37fbd6c9539d6cf2445f64dc4b1117213676268c598408139ee02
3
  size 343230128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5351ced59e7c85a3fb2f7c177c877ac1785f0eb288bcfa15c371ef575b43f0b
3
  size 343230128
tmp-checkpoint-1114/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64dd87c6814b49faccd074f8570112764ba4f50313926e9021cb6a6ba0611322
3
  size 686581178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec00798806d5720e65e019906ab50a6c32a2e71b4e04445be9e06392939427dc
3
  size 686581178
tmp-checkpoint-1114/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14a82bd7aac7f48f94a640c01bb3e50324f04a791daa0d0bad2d6efb342e3a54
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24b3a83bdc525e31fc774b467e5328a4a4771dbb41e450889d48b38e20ba1bfc
3
  size 14244
tmp-checkpoint-1114/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.40481075644493103,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-crack-detectorVITmain50epochs\\checkpoint-1114",
4
  "epoch": 0.9993272034088361,
5
  "eval_steps": 500,
@@ -11,687 +11,687 @@
11
  {
12
  "epoch": 0.01,
13
  "learning_rate": 8.976660682226213e-08,
14
- "loss": 1.3944,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.02,
19
  "learning_rate": 1.7953321364452426e-07,
20
- "loss": 1.3875,
21
  "step": 20
22
  },
23
  {
24
  "epoch": 0.03,
25
  "learning_rate": 2.692998204667864e-07,
26
- "loss": 1.3999,
27
  "step": 30
28
  },
29
  {
30
  "epoch": 0.04,
31
  "learning_rate": 3.590664272890485e-07,
32
- "loss": 1.3915,
33
  "step": 40
34
  },
35
  {
36
  "epoch": 0.04,
37
  "learning_rate": 4.4883303411131064e-07,
38
- "loss": 1.3856,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 0.05,
43
  "learning_rate": 5.385996409335728e-07,
44
- "loss": 1.3912,
45
  "step": 60
46
  },
47
  {
48
  "epoch": 0.06,
49
  "learning_rate": 6.283662477558349e-07,
50
- "loss": 1.3902,
51
  "step": 70
52
  },
53
  {
54
  "epoch": 0.07,
55
  "learning_rate": 7.18132854578097e-07,
56
- "loss": 1.3851,
57
  "step": 80
58
  },
59
  {
60
  "epoch": 0.08,
61
  "learning_rate": 8.078994614003591e-07,
62
- "loss": 1.3755,
63
  "step": 90
64
  },
65
  {
66
  "epoch": 0.09,
67
  "learning_rate": 8.976660682226213e-07,
68
- "loss": 1.3793,
69
  "step": 100
70
  },
71
  {
72
  "epoch": 0.1,
73
  "learning_rate": 9.874326750448833e-07,
74
- "loss": 1.3737,
75
  "step": 110
76
  },
77
  {
78
  "epoch": 0.11,
79
  "learning_rate": 1.0771992818671456e-06,
80
- "loss": 1.3736,
81
  "step": 120
82
  },
83
  {
84
  "epoch": 0.12,
85
  "learning_rate": 1.1669658886894075e-06,
86
- "loss": 1.3678,
87
  "step": 130
88
  },
89
  {
90
  "epoch": 0.13,
91
  "learning_rate": 1.2567324955116697e-06,
92
- "loss": 1.3637,
93
  "step": 140
94
  },
95
  {
96
  "epoch": 0.13,
97
  "learning_rate": 1.3464991023339318e-06,
98
- "loss": 1.357,
99
  "step": 150
100
  },
101
  {
102
  "epoch": 0.14,
103
  "learning_rate": 1.436265709156194e-06,
104
- "loss": 1.3583,
105
  "step": 160
106
  },
107
  {
108
  "epoch": 0.15,
109
  "learning_rate": 1.5260323159784561e-06,
110
- "loss": 1.361,
111
  "step": 170
112
  },
113
  {
114
  "epoch": 0.16,
115
  "learning_rate": 1.6157989228007182e-06,
116
- "loss": 1.3517,
117
  "step": 180
118
  },
119
  {
120
  "epoch": 0.17,
121
  "learning_rate": 1.7055655296229805e-06,
122
- "loss": 1.3543,
123
  "step": 190
124
  },
125
  {
126
  "epoch": 0.18,
127
  "learning_rate": 1.7953321364452425e-06,
128
- "loss": 1.3497,
129
  "step": 200
130
  },
131
  {
132
  "epoch": 0.19,
133
  "learning_rate": 1.8850987432675046e-06,
134
- "loss": 1.3436,
135
  "step": 210
136
  },
137
  {
138
  "epoch": 0.2,
139
  "learning_rate": 1.9748653500897667e-06,
140
- "loss": 1.3304,
141
  "step": 220
142
  },
143
  {
144
  "epoch": 0.21,
145
  "learning_rate": 2.064631956912029e-06,
146
- "loss": 1.3262,
147
  "step": 230
148
  },
149
  {
150
  "epoch": 0.22,
151
  "learning_rate": 2.1543985637342912e-06,
152
- "loss": 1.3209,
153
  "step": 240
154
  },
155
  {
156
  "epoch": 0.22,
157
  "learning_rate": 2.244165170556553e-06,
158
- "loss": 1.3054,
159
  "step": 250
160
  },
161
  {
162
  "epoch": 0.23,
163
  "learning_rate": 2.333931777378815e-06,
164
- "loss": 1.3028,
165
  "step": 260
166
  },
167
  {
168
  "epoch": 0.24,
169
  "learning_rate": 2.423698384201077e-06,
170
- "loss": 1.2939,
171
  "step": 270
172
  },
173
  {
174
  "epoch": 0.25,
175
  "learning_rate": 2.5134649910233395e-06,
176
- "loss": 1.2894,
177
  "step": 280
178
  },
179
  {
180
  "epoch": 0.26,
181
  "learning_rate": 2.6032315978456015e-06,
182
- "loss": 1.2838,
183
  "step": 290
184
  },
185
  {
186
  "epoch": 0.27,
187
  "learning_rate": 2.6929982046678636e-06,
188
- "loss": 1.2625,
189
  "step": 300
190
  },
191
  {
192
  "epoch": 0.28,
193
  "learning_rate": 2.7827648114901257e-06,
194
- "loss": 1.2727,
195
  "step": 310
196
  },
197
  {
198
  "epoch": 0.29,
199
  "learning_rate": 2.872531418312388e-06,
200
- "loss": 1.2398,
201
  "step": 320
202
  },
203
  {
204
  "epoch": 0.3,
205
  "learning_rate": 2.9622980251346502e-06,
206
- "loss": 1.2267,
207
  "step": 330
208
  },
209
  {
210
  "epoch": 0.31,
211
  "learning_rate": 3.0520646319569123e-06,
212
- "loss": 1.2359,
213
  "step": 340
214
  },
215
  {
216
  "epoch": 0.31,
217
  "learning_rate": 3.1418312387791743e-06,
218
- "loss": 1.218,
219
  "step": 350
220
  },
221
  {
222
  "epoch": 0.32,
223
  "learning_rate": 3.2315978456014364e-06,
224
- "loss": 1.1877,
225
  "step": 360
226
  },
227
  {
228
  "epoch": 0.33,
229
  "learning_rate": 3.321364452423698e-06,
230
- "loss": 1.1764,
231
  "step": 370
232
  },
233
  {
234
  "epoch": 0.34,
235
  "learning_rate": 3.411131059245961e-06,
236
- "loss": 1.151,
237
  "step": 380
238
  },
239
  {
240
  "epoch": 0.35,
241
  "learning_rate": 3.500897666068223e-06,
242
- "loss": 1.1334,
243
  "step": 390
244
  },
245
  {
246
  "epoch": 0.36,
247
  "learning_rate": 3.590664272890485e-06,
248
- "loss": 1.1272,
249
  "step": 400
250
  },
251
  {
252
  "epoch": 0.37,
253
  "learning_rate": 3.680430879712747e-06,
254
- "loss": 1.1077,
255
  "step": 410
256
  },
257
  {
258
  "epoch": 0.38,
259
  "learning_rate": 3.770197486535009e-06,
260
- "loss": 1.1021,
261
  "step": 420
262
  },
263
  {
264
  "epoch": 0.39,
265
  "learning_rate": 3.859964093357271e-06,
266
- "loss": 1.0583,
267
  "step": 430
268
  },
269
  {
270
  "epoch": 0.39,
271
  "learning_rate": 3.949730700179533e-06,
272
- "loss": 1.0482,
273
  "step": 440
274
  },
275
  {
276
  "epoch": 0.4,
277
  "learning_rate": 4.039497307001795e-06,
278
- "loss": 1.0214,
279
  "step": 450
280
  },
281
  {
282
  "epoch": 0.41,
283
  "learning_rate": 4.129263913824058e-06,
284
- "loss": 1.0114,
285
  "step": 460
286
  },
287
  {
288
  "epoch": 0.42,
289
  "learning_rate": 4.21903052064632e-06,
290
- "loss": 1.0237,
291
  "step": 470
292
  },
293
  {
294
  "epoch": 0.43,
295
  "learning_rate": 4.3087971274685824e-06,
296
- "loss": 0.969,
297
  "step": 480
298
  },
299
  {
300
  "epoch": 0.44,
301
  "learning_rate": 4.3985637342908445e-06,
302
- "loss": 0.966,
303
  "step": 490
304
  },
305
  {
306
  "epoch": 0.45,
307
  "learning_rate": 4.488330341113106e-06,
308
- "loss": 0.9518,
309
  "step": 500
310
  },
311
  {
312
  "epoch": 0.46,
313
  "learning_rate": 4.578096947935368e-06,
314
- "loss": 0.9545,
315
  "step": 510
316
  },
317
  {
318
  "epoch": 0.47,
319
  "learning_rate": 4.66786355475763e-06,
320
- "loss": 0.9473,
321
  "step": 520
322
  },
323
  {
324
  "epoch": 0.48,
325
  "learning_rate": 4.757630161579892e-06,
326
- "loss": 0.9026,
327
  "step": 530
328
  },
329
  {
330
  "epoch": 0.48,
331
  "learning_rate": 4.847396768402154e-06,
332
- "loss": 0.8535,
333
  "step": 540
334
  },
335
  {
336
  "epoch": 0.49,
337
  "learning_rate": 4.937163375224417e-06,
338
- "loss": 0.8598,
339
  "step": 550
340
  },
341
  {
342
  "epoch": 0.5,
343
  "learning_rate": 5.026929982046679e-06,
344
- "loss": 0.8154,
345
  "step": 560
346
  },
347
  {
348
  "epoch": 0.51,
349
  "learning_rate": 5.116696588868941e-06,
350
- "loss": 0.8561,
351
  "step": 570
352
  },
353
  {
354
  "epoch": 0.52,
355
  "learning_rate": 5.206463195691203e-06,
356
- "loss": 0.7924,
357
  "step": 580
358
  },
359
  {
360
  "epoch": 0.53,
361
  "learning_rate": 5.296229802513465e-06,
362
- "loss": 0.7947,
363
  "step": 590
364
  },
365
  {
366
  "epoch": 0.54,
367
  "learning_rate": 5.385996409335727e-06,
368
- "loss": 0.7999,
369
  "step": 600
370
  },
371
  {
372
  "epoch": 0.55,
373
  "learning_rate": 5.475763016157989e-06,
374
- "loss": 0.7771,
375
  "step": 610
376
  },
377
  {
378
  "epoch": 0.56,
379
  "learning_rate": 5.565529622980251e-06,
380
- "loss": 0.7826,
381
  "step": 620
382
  },
383
  {
384
  "epoch": 0.57,
385
  "learning_rate": 5.655296229802514e-06,
386
- "loss": 0.7321,
387
  "step": 630
388
  },
389
  {
390
  "epoch": 0.57,
391
  "learning_rate": 5.745062836624776e-06,
392
- "loss": 0.7689,
393
  "step": 640
394
  },
395
  {
396
  "epoch": 0.58,
397
  "learning_rate": 5.834829443447038e-06,
398
- "loss": 0.7546,
399
  "step": 650
400
  },
401
  {
402
  "epoch": 0.59,
403
  "learning_rate": 5.9245960502693004e-06,
404
- "loss": 0.7336,
405
  "step": 660
406
  },
407
  {
408
  "epoch": 0.6,
409
  "learning_rate": 6.0143626570915625e-06,
410
- "loss": 0.6889,
411
  "step": 670
412
  },
413
  {
414
  "epoch": 0.61,
415
  "learning_rate": 6.1041292639138246e-06,
416
- "loss": 0.6996,
417
  "step": 680
418
  },
419
  {
420
  "epoch": 0.62,
421
  "learning_rate": 6.193895870736087e-06,
422
- "loss": 0.6994,
423
  "step": 690
424
  },
425
  {
426
  "epoch": 0.63,
427
  "learning_rate": 6.283662477558349e-06,
428
- "loss": 0.74,
429
  "step": 700
430
  },
431
  {
432
  "epoch": 0.64,
433
  "learning_rate": 6.373429084380611e-06,
434
- "loss": 0.711,
435
  "step": 710
436
  },
437
  {
438
  "epoch": 0.65,
439
  "learning_rate": 6.463195691202873e-06,
440
- "loss": 0.6765,
441
  "step": 720
442
  },
443
  {
444
  "epoch": 0.65,
445
  "learning_rate": 6.552962298025135e-06,
446
- "loss": 0.6717,
447
  "step": 730
448
  },
449
  {
450
  "epoch": 0.66,
451
  "learning_rate": 6.642728904847396e-06,
452
- "loss": 0.6776,
453
  "step": 740
454
  },
455
  {
456
  "epoch": 0.67,
457
  "learning_rate": 6.732495511669659e-06,
458
- "loss": 0.62,
459
  "step": 750
460
  },
461
  {
462
  "epoch": 0.68,
463
  "learning_rate": 6.822262118491922e-06,
464
- "loss": 0.6392,
465
  "step": 760
466
  },
467
  {
468
  "epoch": 0.69,
469
  "learning_rate": 6.912028725314183e-06,
470
- "loss": 0.62,
471
  "step": 770
472
  },
473
  {
474
  "epoch": 0.7,
475
  "learning_rate": 7.001795332136446e-06,
476
- "loss": 0.6103,
477
  "step": 780
478
  },
479
  {
480
  "epoch": 0.71,
481
  "learning_rate": 7.091561938958707e-06,
482
- "loss": 0.6504,
483
  "step": 790
484
  },
485
  {
486
  "epoch": 0.72,
487
  "learning_rate": 7.18132854578097e-06,
488
- "loss": 0.6126,
489
  "step": 800
490
  },
491
  {
492
  "epoch": 0.73,
493
  "learning_rate": 7.271095152603231e-06,
494
- "loss": 0.5707,
495
  "step": 810
496
  },
497
  {
498
  "epoch": 0.74,
499
  "learning_rate": 7.360861759425494e-06,
500
- "loss": 0.587,
501
  "step": 820
502
  },
503
  {
504
  "epoch": 0.74,
505
  "learning_rate": 7.4506283662477555e-06,
506
- "loss": 0.5684,
507
  "step": 830
508
  },
509
  {
510
  "epoch": 0.75,
511
  "learning_rate": 7.540394973070018e-06,
512
- "loss": 0.5586,
513
  "step": 840
514
  },
515
  {
516
  "epoch": 0.76,
517
  "learning_rate": 7.630161579892281e-06,
518
- "loss": 0.6074,
519
  "step": 850
520
  },
521
  {
522
  "epoch": 0.77,
523
  "learning_rate": 7.719928186714543e-06,
524
- "loss": 0.5638,
525
  "step": 860
526
  },
527
  {
528
  "epoch": 0.78,
529
  "learning_rate": 7.809694793536805e-06,
530
- "loss": 0.5952,
531
  "step": 870
532
  },
533
  {
534
  "epoch": 0.79,
535
  "learning_rate": 7.899461400359067e-06,
536
- "loss": 0.5647,
537
  "step": 880
538
  },
539
  {
540
  "epoch": 0.8,
541
  "learning_rate": 7.98922800718133e-06,
542
- "loss": 0.6049,
543
  "step": 890
544
  },
545
  {
546
  "epoch": 0.81,
547
  "learning_rate": 8.07899461400359e-06,
548
- "loss": 0.5525,
549
  "step": 900
550
  },
551
  {
552
  "epoch": 0.82,
553
  "learning_rate": 8.168761220825854e-06,
554
- "loss": 0.522,
555
  "step": 910
556
  },
557
  {
558
  "epoch": 0.83,
559
  "learning_rate": 8.258527827648117e-06,
560
- "loss": 0.5489,
561
  "step": 920
562
  },
563
  {
564
  "epoch": 0.83,
565
  "learning_rate": 8.348294434470378e-06,
566
- "loss": 0.5394,
567
  "step": 930
568
  },
569
  {
570
  "epoch": 0.84,
571
  "learning_rate": 8.43806104129264e-06,
572
- "loss": 0.5707,
573
  "step": 940
574
  },
575
  {
576
  "epoch": 0.85,
577
  "learning_rate": 8.527827648114902e-06,
578
- "loss": 0.5322,
579
  "step": 950
580
  },
581
  {
582
  "epoch": 0.86,
583
  "learning_rate": 8.617594254937165e-06,
584
- "loss": 0.5637,
585
  "step": 960
586
  },
587
  {
588
  "epoch": 0.87,
589
  "learning_rate": 8.707360861759426e-06,
590
- "loss": 0.529,
591
  "step": 970
592
  },
593
  {
594
  "epoch": 0.88,
595
  "learning_rate": 8.797127468581689e-06,
596
- "loss": 0.51,
597
  "step": 980
598
  },
599
  {
600
  "epoch": 0.89,
601
  "learning_rate": 8.88689407540395e-06,
602
- "loss": 0.4844,
603
  "step": 990
604
  },
605
  {
606
  "epoch": 0.9,
607
  "learning_rate": 8.976660682226211e-06,
608
- "loss": 0.5349,
609
  "step": 1000
610
  },
611
  {
612
  "epoch": 0.91,
613
  "learning_rate": 9.066427289048474e-06,
614
- "loss": 0.5377,
615
  "step": 1010
616
  },
617
  {
618
  "epoch": 0.92,
619
  "learning_rate": 9.156193895870736e-06,
620
- "loss": 0.4985,
621
  "step": 1020
622
  },
623
  {
624
  "epoch": 0.92,
625
  "learning_rate": 9.245960502692998e-06,
626
- "loss": 0.5533,
627
  "step": 1030
628
  },
629
  {
630
  "epoch": 0.93,
631
  "learning_rate": 9.33572710951526e-06,
632
- "loss": 0.4955,
633
  "step": 1040
634
  },
635
  {
636
  "epoch": 0.94,
637
  "learning_rate": 9.425493716337523e-06,
638
- "loss": 0.541,
639
  "step": 1050
640
  },
641
  {
642
  "epoch": 0.95,
643
  "learning_rate": 9.515260323159784e-06,
644
- "loss": 0.4757,
645
  "step": 1060
646
  },
647
  {
648
  "epoch": 0.96,
649
  "learning_rate": 9.605026929982047e-06,
650
- "loss": 0.5478,
651
  "step": 1070
652
  },
653
  {
654
  "epoch": 0.97,
655
  "learning_rate": 9.694793536804308e-06,
656
- "loss": 0.5281,
657
  "step": 1080
658
  },
659
  {
660
  "epoch": 0.98,
661
  "learning_rate": 9.784560143626571e-06,
662
- "loss": 0.5187,
663
  "step": 1090
664
  },
665
  {
666
  "epoch": 0.99,
667
  "learning_rate": 9.874326750448834e-06,
668
- "loss": 0.4591,
669
  "step": 1100
670
  },
671
  {
672
  "epoch": 1.0,
673
  "learning_rate": 9.964093357271095e-06,
674
- "loss": 0.5344,
675
  "step": 1110
676
  },
677
  {
678
  "epoch": 1.0,
679
  "eval_accuracy": {
680
- "accuracy": 0.8744113029827315
681
  },
682
  "eval_f1": {
683
- "f1": 0.8645201833830978
684
  },
685
- "eval_loss": 0.40481075644493103,
686
  "eval_precision": {
687
- "precision": 0.8668175457367389
688
  },
689
  "eval_recall": {
690
- "recall": 0.8631211355155497
691
  },
692
- "eval_runtime": 243.6123,
693
- "eval_samples_per_second": 73.215,
694
- "eval_steps_per_second": 4.577,
695
  "step": 1114
696
  }
697
  ],
 
1
  {
2
+ "best_metric": 0.4108576774597168,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-crack-detectorVITmain50epochs\\checkpoint-1114",
4
  "epoch": 0.9993272034088361,
5
  "eval_steps": 500,
 
11
  {
12
  "epoch": 0.01,
13
  "learning_rate": 8.976660682226213e-08,
14
+ "loss": 1.3961,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.02,
19
  "learning_rate": 1.7953321364452426e-07,
20
+ "loss": 1.395,
21
  "step": 20
22
  },
23
  {
24
  "epoch": 0.03,
25
  "learning_rate": 2.692998204667864e-07,
26
+ "loss": 1.3978,
27
  "step": 30
28
  },
29
  {
30
  "epoch": 0.04,
31
  "learning_rate": 3.590664272890485e-07,
32
+ "loss": 1.3963,
33
  "step": 40
34
  },
35
  {
36
  "epoch": 0.04,
37
  "learning_rate": 4.4883303411131064e-07,
38
+ "loss": 1.3907,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 0.05,
43
  "learning_rate": 5.385996409335728e-07,
44
+ "loss": 1.396,
45
  "step": 60
46
  },
47
  {
48
  "epoch": 0.06,
49
  "learning_rate": 6.283662477558349e-07,
50
+ "loss": 1.3885,
51
  "step": 70
52
  },
53
  {
54
  "epoch": 0.07,
55
  "learning_rate": 7.18132854578097e-07,
56
+ "loss": 1.387,
57
  "step": 80
58
  },
59
  {
60
  "epoch": 0.08,
61
  "learning_rate": 8.078994614003591e-07,
62
+ "loss": 1.3894,
63
  "step": 90
64
  },
65
  {
66
  "epoch": 0.09,
67
  "learning_rate": 8.976660682226213e-07,
68
+ "loss": 1.3806,
69
  "step": 100
70
  },
71
  {
72
  "epoch": 0.1,
73
  "learning_rate": 9.874326750448833e-07,
74
+ "loss": 1.383,
75
  "step": 110
76
  },
77
  {
78
  "epoch": 0.11,
79
  "learning_rate": 1.0771992818671456e-06,
80
+ "loss": 1.3764,
81
  "step": 120
82
  },
83
  {
84
  "epoch": 0.12,
85
  "learning_rate": 1.1669658886894075e-06,
86
+ "loss": 1.3688,
87
  "step": 130
88
  },
89
  {
90
  "epoch": 0.13,
91
  "learning_rate": 1.2567324955116697e-06,
92
+ "loss": 1.3708,
93
  "step": 140
94
  },
95
  {
96
  "epoch": 0.13,
97
  "learning_rate": 1.3464991023339318e-06,
98
+ "loss": 1.366,
99
  "step": 150
100
  },
101
  {
102
  "epoch": 0.14,
103
  "learning_rate": 1.436265709156194e-06,
104
+ "loss": 1.371,
105
  "step": 160
106
  },
107
  {
108
  "epoch": 0.15,
109
  "learning_rate": 1.5260323159784561e-06,
110
+ "loss": 1.3558,
111
  "step": 170
112
  },
113
  {
114
  "epoch": 0.16,
115
  "learning_rate": 1.6157989228007182e-06,
116
+ "loss": 1.3584,
117
  "step": 180
118
  },
119
  {
120
  "epoch": 0.17,
121
  "learning_rate": 1.7055655296229805e-06,
122
+ "loss": 1.3409,
123
  "step": 190
124
  },
125
  {
126
  "epoch": 0.18,
127
  "learning_rate": 1.7953321364452425e-06,
128
+ "loss": 1.346,
129
  "step": 200
130
  },
131
  {
132
  "epoch": 0.19,
133
  "learning_rate": 1.8850987432675046e-06,
134
+ "loss": 1.3355,
135
  "step": 210
136
  },
137
  {
138
  "epoch": 0.2,
139
  "learning_rate": 1.9748653500897667e-06,
140
+ "loss": 1.3323,
141
  "step": 220
142
  },
143
  {
144
  "epoch": 0.21,
145
  "learning_rate": 2.064631956912029e-06,
146
+ "loss": 1.3231,
147
  "step": 230
148
  },
149
  {
150
  "epoch": 0.22,
151
  "learning_rate": 2.1543985637342912e-06,
152
+ "loss": 1.3129,
153
  "step": 240
154
  },
155
  {
156
  "epoch": 0.22,
157
  "learning_rate": 2.244165170556553e-06,
158
+ "loss": 1.3178,
159
  "step": 250
160
  },
161
  {
162
  "epoch": 0.23,
163
  "learning_rate": 2.333931777378815e-06,
164
+ "loss": 1.2953,
165
  "step": 260
166
  },
167
  {
168
  "epoch": 0.24,
169
  "learning_rate": 2.423698384201077e-06,
170
+ "loss": 1.2938,
171
  "step": 270
172
  },
173
  {
174
  "epoch": 0.25,
175
  "learning_rate": 2.5134649910233395e-06,
176
+ "loss": 1.2849,
177
  "step": 280
178
  },
179
  {
180
  "epoch": 0.26,
181
  "learning_rate": 2.6032315978456015e-06,
182
+ "loss": 1.2813,
183
  "step": 290
184
  },
185
  {
186
  "epoch": 0.27,
187
  "learning_rate": 2.6929982046678636e-06,
188
+ "loss": 1.2811,
189
  "step": 300
190
  },
191
  {
192
  "epoch": 0.28,
193
  "learning_rate": 2.7827648114901257e-06,
194
+ "loss": 1.2526,
195
  "step": 310
196
  },
197
  {
198
  "epoch": 0.29,
199
  "learning_rate": 2.872531418312388e-06,
200
+ "loss": 1.2438,
201
  "step": 320
202
  },
203
  {
204
  "epoch": 0.3,
205
  "learning_rate": 2.9622980251346502e-06,
206
+ "loss": 1.2145,
207
  "step": 330
208
  },
209
  {
210
  "epoch": 0.31,
211
  "learning_rate": 3.0520646319569123e-06,
212
+ "loss": 1.2146,
213
  "step": 340
214
  },
215
  {
216
  "epoch": 0.31,
217
  "learning_rate": 3.1418312387791743e-06,
218
+ "loss": 1.1883,
219
  "step": 350
220
  },
221
  {
222
  "epoch": 0.32,
223
  "learning_rate": 3.2315978456014364e-06,
224
+ "loss": 1.1891,
225
  "step": 360
226
  },
227
  {
228
  "epoch": 0.33,
229
  "learning_rate": 3.321364452423698e-06,
230
+ "loss": 1.1723,
231
  "step": 370
232
  },
233
  {
234
  "epoch": 0.34,
235
  "learning_rate": 3.411131059245961e-06,
236
+ "loss": 1.1417,
237
  "step": 380
238
  },
239
  {
240
  "epoch": 0.35,
241
  "learning_rate": 3.500897666068223e-06,
242
+ "loss": 1.1338,
243
  "step": 390
244
  },
245
  {
246
  "epoch": 0.36,
247
  "learning_rate": 3.590664272890485e-06,
248
+ "loss": 1.1004,
249
  "step": 400
250
  },
251
  {
252
  "epoch": 0.37,
253
  "learning_rate": 3.680430879712747e-06,
254
+ "loss": 1.0873,
255
  "step": 410
256
  },
257
  {
258
  "epoch": 0.38,
259
  "learning_rate": 3.770197486535009e-06,
260
+ "loss": 1.0358,
261
  "step": 420
262
  },
263
  {
264
  "epoch": 0.39,
265
  "learning_rate": 3.859964093357271e-06,
266
+ "loss": 1.0517,
267
  "step": 430
268
  },
269
  {
270
  "epoch": 0.39,
271
  "learning_rate": 3.949730700179533e-06,
272
+ "loss": 1.0139,
273
  "step": 440
274
  },
275
  {
276
  "epoch": 0.4,
277
  "learning_rate": 4.039497307001795e-06,
278
+ "loss": 1.0294,
279
  "step": 450
280
  },
281
  {
282
  "epoch": 0.41,
283
  "learning_rate": 4.129263913824058e-06,
284
+ "loss": 1.0171,
285
  "step": 460
286
  },
287
  {
288
  "epoch": 0.42,
289
  "learning_rate": 4.21903052064632e-06,
290
+ "loss": 0.9827,
291
  "step": 470
292
  },
293
  {
294
  "epoch": 0.43,
295
  "learning_rate": 4.3087971274685824e-06,
296
+ "loss": 0.9382,
297
  "step": 480
298
  },
299
  {
300
  "epoch": 0.44,
301
  "learning_rate": 4.3985637342908445e-06,
302
+ "loss": 0.9145,
303
  "step": 490
304
  },
305
  {
306
  "epoch": 0.45,
307
  "learning_rate": 4.488330341113106e-06,
308
+ "loss": 0.9276,
309
  "step": 500
310
  },
311
  {
312
  "epoch": 0.46,
313
  "learning_rate": 4.578096947935368e-06,
314
+ "loss": 0.8801,
315
  "step": 510
316
  },
317
  {
318
  "epoch": 0.47,
319
  "learning_rate": 4.66786355475763e-06,
320
+ "loss": 0.8906,
321
  "step": 520
322
  },
323
  {
324
  "epoch": 0.48,
325
  "learning_rate": 4.757630161579892e-06,
326
+ "loss": 0.9025,
327
  "step": 530
328
  },
329
  {
330
  "epoch": 0.48,
331
  "learning_rate": 4.847396768402154e-06,
332
+ "loss": 0.8621,
333
  "step": 540
334
  },
335
  {
336
  "epoch": 0.49,
337
  "learning_rate": 4.937163375224417e-06,
338
+ "loss": 0.8653,
339
  "step": 550
340
  },
341
  {
342
  "epoch": 0.5,
343
  "learning_rate": 5.026929982046679e-06,
344
+ "loss": 0.8292,
345
  "step": 560
346
  },
347
  {
348
  "epoch": 0.51,
349
  "learning_rate": 5.116696588868941e-06,
350
+ "loss": 0.8195,
351
  "step": 570
352
  },
353
  {
354
  "epoch": 0.52,
355
  "learning_rate": 5.206463195691203e-06,
356
+ "loss": 0.8026,
357
  "step": 580
358
  },
359
  {
360
  "epoch": 0.53,
361
  "learning_rate": 5.296229802513465e-06,
362
+ "loss": 0.841,
363
  "step": 590
364
  },
365
  {
366
  "epoch": 0.54,
367
  "learning_rate": 5.385996409335727e-06,
368
+ "loss": 0.778,
369
  "step": 600
370
  },
371
  {
372
  "epoch": 0.55,
373
  "learning_rate": 5.475763016157989e-06,
374
+ "loss": 0.7706,
375
  "step": 610
376
  },
377
  {
378
  "epoch": 0.56,
379
  "learning_rate": 5.565529622980251e-06,
380
+ "loss": 0.733,
381
  "step": 620
382
  },
383
  {
384
  "epoch": 0.57,
385
  "learning_rate": 5.655296229802514e-06,
386
+ "loss": 0.7437,
387
  "step": 630
388
  },
389
  {
390
  "epoch": 0.57,
391
  "learning_rate": 5.745062836624776e-06,
392
+ "loss": 0.7644,
393
  "step": 640
394
  },
395
  {
396
  "epoch": 0.58,
397
  "learning_rate": 5.834829443447038e-06,
398
+ "loss": 0.7125,
399
  "step": 650
400
  },
401
  {
402
  "epoch": 0.59,
403
  "learning_rate": 5.9245960502693004e-06,
404
+ "loss": 0.7146,
405
  "step": 660
406
  },
407
  {
408
  "epoch": 0.6,
409
  "learning_rate": 6.0143626570915625e-06,
410
+ "loss": 0.7201,
411
  "step": 670
412
  },
413
  {
414
  "epoch": 0.61,
415
  "learning_rate": 6.1041292639138246e-06,
416
+ "loss": 0.6851,
417
  "step": 680
418
  },
419
  {
420
  "epoch": 0.62,
421
  "learning_rate": 6.193895870736087e-06,
422
+ "loss": 0.6417,
423
  "step": 690
424
  },
425
  {
426
  "epoch": 0.63,
427
  "learning_rate": 6.283662477558349e-06,
428
+ "loss": 0.6656,
429
  "step": 700
430
  },
431
  {
432
  "epoch": 0.64,
433
  "learning_rate": 6.373429084380611e-06,
434
+ "loss": 0.6122,
435
  "step": 710
436
  },
437
  {
438
  "epoch": 0.65,
439
  "learning_rate": 6.463195691202873e-06,
440
+ "loss": 0.6536,
441
  "step": 720
442
  },
443
  {
444
  "epoch": 0.65,
445
  "learning_rate": 6.552962298025135e-06,
446
+ "loss": 0.6315,
447
  "step": 730
448
  },
449
  {
450
  "epoch": 0.66,
451
  "learning_rate": 6.642728904847396e-06,
452
+ "loss": 0.6618,
453
  "step": 740
454
  },
455
  {
456
  "epoch": 0.67,
457
  "learning_rate": 6.732495511669659e-06,
458
+ "loss": 0.6346,
459
  "step": 750
460
  },
461
  {
462
  "epoch": 0.68,
463
  "learning_rate": 6.822262118491922e-06,
464
+ "loss": 0.6866,
465
  "step": 760
466
  },
467
  {
468
  "epoch": 0.69,
469
  "learning_rate": 6.912028725314183e-06,
470
+ "loss": 0.6093,
471
  "step": 770
472
  },
473
  {
474
  "epoch": 0.7,
475
  "learning_rate": 7.001795332136446e-06,
476
+ "loss": 0.6116,
477
  "step": 780
478
  },
479
  {
480
  "epoch": 0.71,
481
  "learning_rate": 7.091561938958707e-06,
482
+ "loss": 0.602,
483
  "step": 790
484
  },
485
  {
486
  "epoch": 0.72,
487
  "learning_rate": 7.18132854578097e-06,
488
+ "loss": 0.6266,
489
  "step": 800
490
  },
491
  {
492
  "epoch": 0.73,
493
  "learning_rate": 7.271095152603231e-06,
494
+ "loss": 0.6082,
495
  "step": 810
496
  },
497
  {
498
  "epoch": 0.74,
499
  "learning_rate": 7.360861759425494e-06,
500
+ "loss": 0.6194,
501
  "step": 820
502
  },
503
  {
504
  "epoch": 0.74,
505
  "learning_rate": 7.4506283662477555e-06,
506
+ "loss": 0.6277,
507
  "step": 830
508
  },
509
  {
510
  "epoch": 0.75,
511
  "learning_rate": 7.540394973070018e-06,
512
+ "loss": 0.609,
513
  "step": 840
514
  },
515
  {
516
  "epoch": 0.76,
517
  "learning_rate": 7.630161579892281e-06,
518
+ "loss": 0.6252,
519
  "step": 850
520
  },
521
  {
522
  "epoch": 0.77,
523
  "learning_rate": 7.719928186714543e-06,
524
+ "loss": 0.5813,
525
  "step": 860
526
  },
527
  {
528
  "epoch": 0.78,
529
  "learning_rate": 7.809694793536805e-06,
530
+ "loss": 0.5799,
531
  "step": 870
532
  },
533
  {
534
  "epoch": 0.79,
535
  "learning_rate": 7.899461400359067e-06,
536
+ "loss": 0.6398,
537
  "step": 880
538
  },
539
  {
540
  "epoch": 0.8,
541
  "learning_rate": 7.98922800718133e-06,
542
+ "loss": 0.5549,
543
  "step": 890
544
  },
545
  {
546
  "epoch": 0.81,
547
  "learning_rate": 8.07899461400359e-06,
548
+ "loss": 0.6023,
549
  "step": 900
550
  },
551
  {
552
  "epoch": 0.82,
553
  "learning_rate": 8.168761220825854e-06,
554
+ "loss": 0.582,
555
  "step": 910
556
  },
557
  {
558
  "epoch": 0.83,
559
  "learning_rate": 8.258527827648117e-06,
560
+ "loss": 0.544,
561
  "step": 920
562
  },
563
  {
564
  "epoch": 0.83,
565
  "learning_rate": 8.348294434470378e-06,
566
+ "loss": 0.5912,
567
  "step": 930
568
  },
569
  {
570
  "epoch": 0.84,
571
  "learning_rate": 8.43806104129264e-06,
572
+ "loss": 0.5461,
573
  "step": 940
574
  },
575
  {
576
  "epoch": 0.85,
577
  "learning_rate": 8.527827648114902e-06,
578
+ "loss": 0.5238,
579
  "step": 950
580
  },
581
  {
582
  "epoch": 0.86,
583
  "learning_rate": 8.617594254937165e-06,
584
+ "loss": 0.5558,
585
  "step": 960
586
  },
587
  {
588
  "epoch": 0.87,
589
  "learning_rate": 8.707360861759426e-06,
590
+ "loss": 0.5371,
591
  "step": 970
592
  },
593
  {
594
  "epoch": 0.88,
595
  "learning_rate": 8.797127468581689e-06,
596
+ "loss": 0.5529,
597
  "step": 980
598
  },
599
  {
600
  "epoch": 0.89,
601
  "learning_rate": 8.88689407540395e-06,
602
+ "loss": 0.5691,
603
  "step": 990
604
  },
605
  {
606
  "epoch": 0.9,
607
  "learning_rate": 8.976660682226211e-06,
608
+ "loss": 0.5567,
609
  "step": 1000
610
  },
611
  {
612
  "epoch": 0.91,
613
  "learning_rate": 9.066427289048474e-06,
614
+ "loss": 0.5135,
615
  "step": 1010
616
  },
617
  {
618
  "epoch": 0.92,
619
  "learning_rate": 9.156193895870736e-06,
620
+ "loss": 0.5099,
621
  "step": 1020
622
  },
623
  {
624
  "epoch": 0.92,
625
  "learning_rate": 9.245960502692998e-06,
626
+ "loss": 0.5422,
627
  "step": 1030
628
  },
629
  {
630
  "epoch": 0.93,
631
  "learning_rate": 9.33572710951526e-06,
632
+ "loss": 0.5106,
633
  "step": 1040
634
  },
635
  {
636
  "epoch": 0.94,
637
  "learning_rate": 9.425493716337523e-06,
638
+ "loss": 0.4892,
639
  "step": 1050
640
  },
641
  {
642
  "epoch": 0.95,
643
  "learning_rate": 9.515260323159784e-06,
644
+ "loss": 0.4541,
645
  "step": 1060
646
  },
647
  {
648
  "epoch": 0.96,
649
  "learning_rate": 9.605026929982047e-06,
650
+ "loss": 0.4675,
651
  "step": 1070
652
  },
653
  {
654
  "epoch": 0.97,
655
  "learning_rate": 9.694793536804308e-06,
656
+ "loss": 0.5123,
657
  "step": 1080
658
  },
659
  {
660
  "epoch": 0.98,
661
  "learning_rate": 9.784560143626571e-06,
662
+ "loss": 0.5089,
663
  "step": 1090
664
  },
665
  {
666
  "epoch": 0.99,
667
  "learning_rate": 9.874326750448834e-06,
668
+ "loss": 0.5233,
669
  "step": 1100
670
  },
671
  {
672
  "epoch": 1.0,
673
  "learning_rate": 9.964093357271095e-06,
674
+ "loss": 0.5622,
675
  "step": 1110
676
  },
677
  {
678
  "epoch": 1.0,
679
  "eval_accuracy": {
680
+ "accuracy": 0.8736263736263736
681
  },
682
  "eval_f1": {
683
+ "f1": 0.8653360894930927
684
  },
685
+ "eval_loss": 0.4108576774597168,
686
  "eval_precision": {
687
+ "precision": 0.8669392826942903
688
  },
689
  "eval_recall": {
690
+ "recall": 0.8641606609285752
691
  },
692
+ "eval_runtime": 236.9507,
693
+ "eval_samples_per_second": 75.273,
694
+ "eval_steps_per_second": 4.706,
695
  "step": 1114
696
  }
697
  ],
tmp-checkpoint-1114/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3394b871720811033add862f1e1383ca3790e6ab55972b19ed900a5d6b59c978
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c55fb57ba4dc2c9b2c813516c4846a21f1047b19b6cf48a97b9224ced523b9b
3
  size 4792
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3394b871720811033add862f1e1383ca3790e6ab55972b19ed900a5d6b59c978
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c55fb57ba4dc2c9b2c813516c4846a21f1047b19b6cf48a97b9224ced523b9b
3
  size 4792