Soulaimen commited on
Commit
cf30c5f
·
1 Parent(s): d9e456a

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 9.94,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.002956948010250926,
5
- "eval_runtime": 23.6672,
6
- "eval_samples_per_second": 34.943,
7
- "eval_steps_per_second": 4.394,
8
- "total_flos": 1.8367349154946929e+18,
9
- "train_loss": 0.10741477019407532,
10
- "train_runtime": 3799.865,
11
- "train_samples_per_second": 19.572,
12
- "train_steps_per_second": 0.347
13
  }
 
1
  {
2
+ "epoch": 4.97,
3
+ "eval_accuracy": 0.9966480446927374,
4
+ "eval_loss": 0.010998690500855446,
5
+ "eval_runtime": 22.8893,
6
+ "eval_samples_per_second": 39.101,
7
+ "eval_steps_per_second": 4.893,
8
+ "total_flos": 9.948639012864492e+17,
9
+ "train_loss": 0.1435624466075764,
10
+ "train_runtime": 3458.6134,
11
+ "train_samples_per_second": 11.641,
12
+ "train_steps_per_second": 0.207
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.94,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.002956948010250926,
5
- "eval_runtime": 23.6672,
6
- "eval_samples_per_second": 34.943,
7
- "eval_steps_per_second": 4.394
8
  }
 
1
  {
2
+ "epoch": 4.97,
3
+ "eval_accuracy": 0.9966480446927374,
4
+ "eval_loss": 0.010998690500855446,
5
+ "eval_runtime": 22.8893,
6
+ "eval_samples_per_second": 39.101,
7
+ "eval_steps_per_second": 4.893
8
  }
runs/May08_13-23-35_1ed587541f1e/events.out.tfevents.1683555751.1ed587541f1e.1694.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e324b03b56b1c7f5de352453b1d85c489c1b01fbd171289a65f020ed20267f00
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.94,
3
- "total_flos": 1.8367349154946929e+18,
4
- "train_loss": 0.10741477019407532,
5
- "train_runtime": 3799.865,
6
- "train_samples_per_second": 19.572,
7
- "train_steps_per_second": 0.347
8
  }
 
1
  {
2
+ "epoch": 4.97,
3
+ "total_flos": 9.948639012864492e+17,
4
+ "train_loss": 0.1435624466075764,
5
+ "train_runtime": 3458.6134,
6
+ "train_samples_per_second": 11.641,
7
+ "train_steps_per_second": 0.207
8
  }
trainer_state.json CHANGED
@@ -1,907 +1,496 @@
1
  {
2
- "best_metric": 1.0,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-LongSleeveCleanedData/checkpoint-930",
4
- "epoch": 9.935483870967742,
5
- "global_step": 1320,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.08,
12
- "learning_rate": 3.571428571428572e-05,
13
- "loss": 1.0666,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 0.15,
18
- "learning_rate": 4.9770290964777946e-05,
19
- "loss": 0.7487,
20
  "step": 20
21
  },
22
  {
23
- "epoch": 0.23,
24
- "learning_rate": 4.93874425727412e-05,
25
- "loss": 0.481,
26
  "step": 30
27
  },
28
  {
29
- "epoch": 0.3,
30
- "learning_rate": 4.900459418070444e-05,
31
- "loss": 0.351,
32
  "step": 40
33
  },
34
  {
35
- "epoch": 0.38,
36
- "learning_rate": 4.862174578866769e-05,
37
- "loss": 0.2594,
38
  "step": 50
39
  },
40
  {
41
- "epoch": 0.45,
42
- "learning_rate": 4.823889739663094e-05,
43
- "loss": 0.3307,
44
  "step": 60
45
  },
46
  {
47
- "epoch": 0.53,
48
- "learning_rate": 4.785604900459418e-05,
49
- "loss": 0.2245,
50
  "step": 70
51
  },
52
  {
53
- "epoch": 0.6,
54
- "learning_rate": 4.747320061255743e-05,
55
- "loss": 0.1778,
56
  "step": 80
57
  },
58
  {
59
- "epoch": 0.68,
60
- "learning_rate": 4.709035222052068e-05,
61
- "loss": 0.216,
62
  "step": 90
63
  },
64
  {
65
- "epoch": 0.75,
66
- "learning_rate": 4.670750382848392e-05,
67
- "loss": 0.1601,
68
  "step": 100
69
  },
70
  {
71
- "epoch": 0.83,
72
- "learning_rate": 4.632465543644717e-05,
73
- "loss": 0.2145,
74
  "step": 110
75
  },
76
  {
77
- "epoch": 0.9,
78
- "learning_rate": 4.594180704441042e-05,
79
- "loss": 0.2227,
80
  "step": 120
81
  },
82
  {
83
- "epoch": 0.98,
84
- "learning_rate": 4.555895865237366e-05,
85
- "loss": 0.1472,
86
  "step": 130
87
  },
88
  {
89
- "epoch": 0.99,
90
- "eval_accuracy": 0.9830713422007256,
91
- "eval_loss": 0.04599744826555252,
92
- "eval_runtime": 128.5076,
93
- "eval_samples_per_second": 6.435,
94
- "eval_steps_per_second": 0.809,
95
- "step": 132
96
  },
97
  {
98
- "epoch": 1.05,
99
- "learning_rate": 4.517611026033691e-05,
100
- "loss": 0.1663,
101
- "step": 140
 
 
 
102
  },
103
  {
104
- "epoch": 1.13,
105
- "learning_rate": 4.479326186830016e-05,
106
- "loss": 0.1108,
107
  "step": 150
108
  },
109
  {
110
- "epoch": 1.2,
111
- "learning_rate": 4.4410413476263404e-05,
112
- "loss": 0.1293,
113
  "step": 160
114
  },
115
  {
116
- "epoch": 1.28,
117
- "learning_rate": 4.402756508422665e-05,
118
- "loss": 0.1695,
119
  "step": 170
120
  },
121
  {
122
- "epoch": 1.35,
123
- "learning_rate": 4.36447166921899e-05,
124
- "loss": 0.1437,
125
  "step": 180
126
  },
127
  {
128
- "epoch": 1.43,
129
- "learning_rate": 4.3261868300153144e-05,
130
- "loss": 0.1342,
131
  "step": 190
132
  },
133
  {
134
- "epoch": 1.51,
135
- "learning_rate": 4.287901990811639e-05,
136
- "loss": 0.1243,
137
  "step": 200
138
  },
139
  {
140
- "epoch": 1.58,
141
- "learning_rate": 4.249617151607963e-05,
142
- "loss": 0.1295,
143
  "step": 210
144
  },
145
  {
146
- "epoch": 1.66,
147
- "learning_rate": 4.211332312404288e-05,
148
- "loss": 0.1061,
149
  "step": 220
150
  },
151
  {
152
- "epoch": 1.73,
153
- "learning_rate": 4.173047473200612e-05,
154
- "loss": 0.1433,
155
  "step": 230
156
  },
157
  {
158
- "epoch": 1.81,
159
- "learning_rate": 4.1347626339969374e-05,
160
- "loss": 0.167,
161
  "step": 240
162
  },
163
  {
164
- "epoch": 1.88,
165
- "learning_rate": 4.096477794793262e-05,
166
- "loss": 0.0885,
167
  "step": 250
168
  },
169
  {
170
- "epoch": 1.96,
171
- "learning_rate": 4.058192955589586e-05,
172
- "loss": 0.1171,
173
  "step": 260
174
  },
175
  {
176
- "epoch": 1.99,
177
- "eval_accuracy": 0.9903264812575574,
178
- "eval_loss": 0.021295879036188126,
179
- "eval_runtime": 22.6767,
180
- "eval_samples_per_second": 36.469,
181
- "eval_steps_per_second": 4.586,
182
- "step": 265
183
- },
184
- {
185
- "epoch": 2.03,
186
- "learning_rate": 4.0199081163859114e-05,
187
- "loss": 0.1212,
188
  "step": 270
189
  },
190
  {
191
- "epoch": 2.11,
192
- "learning_rate": 3.981623277182236e-05,
193
- "loss": 0.0869,
194
  "step": 280
195
  },
196
  {
197
- "epoch": 2.18,
198
- "learning_rate": 3.943338437978561e-05,
199
- "loss": 0.106,
 
 
 
 
 
 
 
 
 
200
  "step": 290
201
  },
202
  {
203
- "epoch": 2.26,
204
- "learning_rate": 3.9050535987748854e-05,
205
- "loss": 0.1024,
206
  "step": 300
207
  },
208
  {
209
- "epoch": 2.33,
210
- "learning_rate": 3.86676875957121e-05,
211
- "loss": 0.1124,
212
  "step": 310
213
  },
214
  {
215
- "epoch": 2.41,
216
- "learning_rate": 3.828483920367535e-05,
217
- "loss": 0.0942,
218
  "step": 320
219
  },
220
  {
221
- "epoch": 2.48,
222
- "learning_rate": 3.7901990811638595e-05,
223
- "loss": 0.1147,
224
  "step": 330
225
  },
226
  {
227
- "epoch": 2.56,
228
- "learning_rate": 3.751914241960184e-05,
229
- "loss": 0.0974,
230
  "step": 340
231
  },
232
  {
233
- "epoch": 2.63,
234
- "learning_rate": 3.713629402756509e-05,
235
- "loss": 0.0877,
236
  "step": 350
237
  },
238
  {
239
- "epoch": 2.71,
240
- "learning_rate": 3.6753445635528335e-05,
241
- "loss": 0.093,
242
  "step": 360
243
  },
244
  {
245
- "epoch": 2.78,
246
- "learning_rate": 3.637059724349158e-05,
247
- "loss": 0.0815,
248
  "step": 370
249
  },
250
  {
251
- "epoch": 2.86,
252
- "learning_rate": 3.598774885145483e-05,
253
- "loss": 0.083,
254
  "step": 380
255
  },
256
  {
257
- "epoch": 2.94,
258
- "learning_rate": 3.5604900459418075e-05,
259
- "loss": 0.133,
260
  "step": 390
261
  },
262
  {
263
- "epoch": 3.0,
264
- "eval_accuracy": 0.9975816203143894,
265
- "eval_loss": 0.007586946245282888,
266
- "eval_runtime": 21.2686,
267
- "eval_samples_per_second": 38.884,
268
- "eval_steps_per_second": 4.89,
269
- "step": 398
270
- },
271
- {
272
- "epoch": 3.01,
273
- "learning_rate": 3.522205206738132e-05,
274
- "loss": 0.1194,
275
  "step": 400
276
  },
277
  {
278
- "epoch": 3.09,
279
- "learning_rate": 3.4839203675344565e-05,
280
- "loss": 0.076,
281
  "step": 410
282
  },
283
  {
284
- "epoch": 3.16,
285
- "learning_rate": 3.445635528330781e-05,
286
- "loss": 0.1054,
287
  "step": 420
288
  },
289
  {
290
- "epoch": 3.24,
291
- "learning_rate": 3.4073506891271054e-05,
292
- "loss": 0.1116,
293
  "step": 430
294
  },
295
  {
296
- "epoch": 3.31,
297
- "learning_rate": 3.3690658499234305e-05,
298
- "loss": 0.0979,
 
 
 
 
 
 
 
 
 
299
  "step": 440
300
  },
301
  {
302
- "epoch": 3.39,
303
- "learning_rate": 3.330781010719755e-05,
304
- "loss": 0.0656,
305
  "step": 450
306
  },
307
  {
308
- "epoch": 3.46,
309
- "learning_rate": 3.2924961715160794e-05,
310
- "loss": 0.0599,
311
  "step": 460
312
  },
313
  {
314
- "epoch": 3.54,
315
- "learning_rate": 3.2542113323124045e-05,
316
- "loss": 0.0693,
317
  "step": 470
318
  },
319
  {
320
- "epoch": 3.61,
321
- "learning_rate": 3.215926493108729e-05,
322
- "loss": 0.1082,
323
  "step": 480
324
  },
325
  {
326
- "epoch": 3.69,
327
- "learning_rate": 3.1776416539050534e-05,
328
- "loss": 0.0696,
329
  "step": 490
330
  },
331
  {
332
- "epoch": 3.76,
333
- "learning_rate": 3.1393568147013786e-05,
334
- "loss": 0.0656,
335
  "step": 500
336
  },
337
  {
338
- "epoch": 3.84,
339
- "learning_rate": 3.101071975497703e-05,
340
- "loss": 0.0767,
341
  "step": 510
342
  },
343
  {
344
- "epoch": 3.91,
345
- "learning_rate": 3.0627871362940275e-05,
346
- "loss": 0.1195,
347
  "step": 520
348
  },
349
  {
350
- "epoch": 3.99,
351
- "learning_rate": 3.0245022970903526e-05,
352
- "loss": 0.0714,
353
  "step": 530
354
  },
355
  {
356
- "epoch": 4.0,
357
- "eval_accuracy": 0.9975816203143894,
358
- "eval_loss": 0.008087977766990662,
359
- "eval_runtime": 23.253,
360
- "eval_samples_per_second": 35.565,
361
- "eval_steps_per_second": 4.473,
362
- "step": 531
363
- },
364
- {
365
- "epoch": 4.06,
366
- "learning_rate": 2.986217457886677e-05,
367
- "loss": 0.1059,
368
  "step": 540
369
  },
370
  {
371
- "epoch": 4.14,
372
- "learning_rate": 2.9479326186830015e-05,
373
- "loss": 0.0458,
374
  "step": 550
375
  },
376
  {
377
- "epoch": 4.22,
378
- "learning_rate": 2.9096477794793263e-05,
379
- "loss": 0.0657,
380
  "step": 560
381
  },
382
  {
383
- "epoch": 4.29,
384
- "learning_rate": 2.8713629402756508e-05,
385
- "loss": 0.1046,
386
  "step": 570
387
  },
388
  {
389
- "epoch": 4.37,
390
- "learning_rate": 2.833078101071976e-05,
391
- "loss": 0.0963,
 
 
 
 
 
 
 
 
 
392
  "step": 580
393
  },
394
  {
395
- "epoch": 4.44,
396
- "learning_rate": 2.7947932618683003e-05,
397
- "loss": 0.0883,
398
  "step": 590
399
  },
400
  {
401
- "epoch": 4.52,
402
- "learning_rate": 2.7565084226646248e-05,
403
- "loss": 0.0713,
404
  "step": 600
405
  },
406
  {
407
- "epoch": 4.59,
408
- "learning_rate": 2.71822358346095e-05,
409
- "loss": 0.1307,
410
  "step": 610
411
  },
412
  {
413
- "epoch": 4.67,
414
- "learning_rate": 2.6799387442572744e-05,
415
- "loss": 0.0879,
416
  "step": 620
417
  },
418
  {
419
- "epoch": 4.74,
420
- "learning_rate": 2.6416539050535988e-05,
421
- "loss": 0.1203,
422
  "step": 630
423
  },
424
  {
425
- "epoch": 4.82,
426
- "learning_rate": 2.603369065849924e-05,
427
- "loss": 0.0743,
428
  "step": 640
429
  },
430
  {
431
- "epoch": 4.89,
432
- "learning_rate": 2.5650842266462484e-05,
433
- "loss": 0.0842,
434
  "step": 650
435
  },
436
  {
437
- "epoch": 4.97,
438
- "learning_rate": 2.526799387442573e-05,
439
- "loss": 0.0776,
440
  "step": 660
441
  },
442
  {
443
- "epoch": 5.0,
444
- "eval_accuracy": 0.9987908101571947,
445
- "eval_loss": 0.005263020750135183,
446
- "eval_runtime": 23.3335,
447
- "eval_samples_per_second": 35.443,
448
- "eval_steps_per_second": 4.457,
449
- "step": 664
450
- },
451
- {
452
- "epoch": 5.04,
453
- "learning_rate": 2.4885145482388973e-05,
454
- "loss": 0.1302,
455
  "step": 670
456
  },
457
  {
458
- "epoch": 5.12,
459
- "learning_rate": 2.450229709035222e-05,
460
- "loss": 0.0708,
461
  "step": 680
462
  },
463
  {
464
- "epoch": 5.19,
465
- "learning_rate": 2.411944869831547e-05,
466
- "loss": 0.0717,
467
  "step": 690
468
  },
469
  {
470
- "epoch": 5.27,
471
- "learning_rate": 2.3736600306278714e-05,
472
- "loss": 0.0932,
473
  "step": 700
474
  },
475
  {
476
- "epoch": 5.34,
477
- "learning_rate": 2.335375191424196e-05,
478
- "loss": 0.0895,
479
  "step": 710
480
  },
481
  {
482
- "epoch": 5.42,
483
- "learning_rate": 2.297090352220521e-05,
484
- "loss": 0.0572,
485
- "step": 720
486
- },
487
- {
488
- "epoch": 5.49,
489
- "learning_rate": 2.2588055130168454e-05,
490
- "loss": 0.0798,
491
- "step": 730
492
- },
493
- {
494
- "epoch": 5.57,
495
- "learning_rate": 2.2205206738131702e-05,
496
- "loss": 0.0588,
497
- "step": 740
498
- },
499
- {
500
- "epoch": 5.65,
501
- "learning_rate": 2.182235834609495e-05,
502
- "loss": 0.0785,
503
- "step": 750
504
- },
505
- {
506
- "epoch": 5.72,
507
- "learning_rate": 2.1439509954058194e-05,
508
- "loss": 0.0803,
509
- "step": 760
510
- },
511
- {
512
- "epoch": 5.8,
513
- "learning_rate": 2.105666156202144e-05,
514
- "loss": 0.0648,
515
- "step": 770
516
- },
517
- {
518
- "epoch": 5.87,
519
- "learning_rate": 2.0673813169984687e-05,
520
- "loss": 0.0589,
521
- "step": 780
522
- },
523
- {
524
- "epoch": 5.95,
525
- "learning_rate": 2.029096477794793e-05,
526
- "loss": 0.0812,
527
- "step": 790
528
- },
529
- {
530
- "epoch": 6.0,
531
- "eval_accuracy": 0.9975816203143894,
532
- "eval_loss": 0.004879950545728207,
533
- "eval_runtime": 22.7765,
534
- "eval_samples_per_second": 36.309,
535
- "eval_steps_per_second": 4.566,
536
- "step": 797
537
- },
538
- {
539
- "epoch": 6.02,
540
- "learning_rate": 1.990811638591118e-05,
541
- "loss": 0.0705,
542
- "step": 800
543
- },
544
- {
545
- "epoch": 6.1,
546
- "learning_rate": 1.9525267993874427e-05,
547
- "loss": 0.0651,
548
- "step": 810
549
- },
550
- {
551
- "epoch": 6.17,
552
- "learning_rate": 1.9142419601837675e-05,
553
- "loss": 0.0941,
554
- "step": 820
555
- },
556
- {
557
- "epoch": 6.25,
558
- "learning_rate": 1.875957120980092e-05,
559
- "loss": 0.0627,
560
- "step": 830
561
- },
562
- {
563
- "epoch": 6.32,
564
- "learning_rate": 1.8376722817764168e-05,
565
- "loss": 0.0868,
566
- "step": 840
567
- },
568
- {
569
- "epoch": 6.4,
570
- "learning_rate": 1.7993874425727415e-05,
571
- "loss": 0.066,
572
- "step": 850
573
- },
574
- {
575
- "epoch": 6.47,
576
- "learning_rate": 1.761102603369066e-05,
577
- "loss": 0.0453,
578
- "step": 860
579
- },
580
- {
581
- "epoch": 6.55,
582
- "learning_rate": 1.7228177641653905e-05,
583
- "loss": 0.0536,
584
- "step": 870
585
- },
586
- {
587
- "epoch": 6.62,
588
- "learning_rate": 1.6845329249617152e-05,
589
- "loss": 0.0723,
590
- "step": 880
591
- },
592
- {
593
- "epoch": 6.7,
594
- "learning_rate": 1.6462480857580397e-05,
595
- "loss": 0.0321,
596
- "step": 890
597
- },
598
- {
599
- "epoch": 6.77,
600
- "learning_rate": 1.6079632465543645e-05,
601
- "loss": 0.1033,
602
- "step": 900
603
- },
604
- {
605
- "epoch": 6.85,
606
- "learning_rate": 1.5696784073506893e-05,
607
- "loss": 0.0763,
608
- "step": 910
609
- },
610
- {
611
- "epoch": 6.92,
612
- "learning_rate": 1.5313935681470137e-05,
613
- "loss": 0.0601,
614
- "step": 920
615
- },
616
- {
617
- "epoch": 7.0,
618
- "learning_rate": 1.4931087289433385e-05,
619
- "loss": 0.0658,
620
- "step": 930
621
- },
622
- {
623
- "epoch": 7.0,
624
- "eval_accuracy": 1.0,
625
- "eval_loss": 0.002956948010250926,
626
- "eval_runtime": 22.0999,
627
- "eval_samples_per_second": 37.421,
628
- "eval_steps_per_second": 4.706,
629
- "step": 930
630
- },
631
- {
632
- "epoch": 7.08,
633
- "learning_rate": 1.4548238897396632e-05,
634
- "loss": 0.0685,
635
- "step": 940
636
- },
637
- {
638
- "epoch": 7.15,
639
- "learning_rate": 1.416539050535988e-05,
640
- "loss": 0.1036,
641
- "step": 950
642
- },
643
- {
644
- "epoch": 7.23,
645
- "learning_rate": 1.3782542113323124e-05,
646
- "loss": 0.0605,
647
- "step": 960
648
- },
649
- {
650
- "epoch": 7.3,
651
- "learning_rate": 1.3399693721286372e-05,
652
- "loss": 0.0671,
653
- "step": 970
654
- },
655
- {
656
- "epoch": 7.38,
657
- "learning_rate": 1.301684532924962e-05,
658
- "loss": 0.0579,
659
- "step": 980
660
- },
661
- {
662
- "epoch": 7.45,
663
- "learning_rate": 1.2633996937212864e-05,
664
- "loss": 0.0456,
665
- "step": 990
666
- },
667
- {
668
- "epoch": 7.53,
669
- "learning_rate": 1.225114854517611e-05,
670
- "loss": 0.0928,
671
- "step": 1000
672
- },
673
- {
674
- "epoch": 7.6,
675
- "learning_rate": 1.1868300153139357e-05,
676
- "loss": 0.0688,
677
- "step": 1010
678
- },
679
- {
680
- "epoch": 7.68,
681
- "learning_rate": 1.1485451761102605e-05,
682
- "loss": 0.0438,
683
- "step": 1020
684
- },
685
- {
686
- "epoch": 7.75,
687
- "learning_rate": 1.1102603369065851e-05,
688
- "loss": 0.0393,
689
- "step": 1030
690
- },
691
- {
692
- "epoch": 7.83,
693
- "learning_rate": 1.0719754977029097e-05,
694
- "loss": 0.074,
695
- "step": 1040
696
- },
697
- {
698
- "epoch": 7.9,
699
- "learning_rate": 1.0336906584992343e-05,
700
- "loss": 0.0597,
701
- "step": 1050
702
- },
703
- {
704
- "epoch": 7.98,
705
- "learning_rate": 9.95405819295559e-06,
706
- "loss": 0.0804,
707
- "step": 1060
708
- },
709
- {
710
- "epoch": 7.99,
711
- "eval_accuracy": 0.9975816203143894,
712
- "eval_loss": 0.0034685195423662663,
713
- "eval_runtime": 22.3239,
714
- "eval_samples_per_second": 37.045,
715
- "eval_steps_per_second": 4.659,
716
- "step": 1062
717
- },
718
- {
719
- "epoch": 8.05,
720
- "learning_rate": 9.571209800918838e-06,
721
- "loss": 0.0558,
722
- "step": 1070
723
- },
724
- {
725
- "epoch": 8.13,
726
- "learning_rate": 9.188361408882084e-06,
727
- "loss": 0.0275,
728
- "step": 1080
729
- },
730
- {
731
- "epoch": 8.2,
732
- "learning_rate": 8.80551301684533e-06,
733
- "loss": 0.0325,
734
- "step": 1090
735
- },
736
- {
737
- "epoch": 8.28,
738
- "learning_rate": 8.422664624808576e-06,
739
- "loss": 0.0652,
740
- "step": 1100
741
- },
742
- {
743
- "epoch": 8.35,
744
- "learning_rate": 8.039816232771822e-06,
745
- "loss": 0.0559,
746
- "step": 1110
747
- },
748
- {
749
- "epoch": 8.43,
750
- "learning_rate": 7.656967840735069e-06,
751
- "loss": 0.0509,
752
- "step": 1120
753
- },
754
- {
755
- "epoch": 8.51,
756
- "learning_rate": 7.274119448698316e-06,
757
- "loss": 0.0698,
758
- "step": 1130
759
- },
760
- {
761
- "epoch": 8.58,
762
- "learning_rate": 6.891271056661562e-06,
763
- "loss": 0.0676,
764
- "step": 1140
765
- },
766
- {
767
- "epoch": 8.66,
768
- "learning_rate": 6.50842266462481e-06,
769
- "loss": 0.0435,
770
- "step": 1150
771
- },
772
- {
773
- "epoch": 8.73,
774
- "learning_rate": 6.125574272588055e-06,
775
- "loss": 0.0535,
776
- "step": 1160
777
- },
778
- {
779
- "epoch": 8.81,
780
- "learning_rate": 5.742725880551302e-06,
781
- "loss": 0.0499,
782
- "step": 1170
783
- },
784
- {
785
- "epoch": 8.88,
786
- "learning_rate": 5.359877488514549e-06,
787
- "loss": 0.0419,
788
- "step": 1180
789
- },
790
- {
791
- "epoch": 8.96,
792
- "learning_rate": 4.977029096477795e-06,
793
- "loss": 0.0508,
794
- "step": 1190
795
- },
796
- {
797
- "epoch": 8.99,
798
- "eval_accuracy": 1.0,
799
- "eval_loss": 0.0011118645779788494,
800
- "eval_runtime": 22.2701,
801
- "eval_samples_per_second": 37.135,
802
- "eval_steps_per_second": 4.67,
803
- "step": 1195
804
- },
805
- {
806
- "epoch": 9.03,
807
- "learning_rate": 4.594180704441042e-06,
808
- "loss": 0.054,
809
- "step": 1200
810
- },
811
- {
812
- "epoch": 9.11,
813
- "learning_rate": 4.211332312404288e-06,
814
- "loss": 0.0596,
815
- "step": 1210
816
- },
817
- {
818
- "epoch": 9.18,
819
- "learning_rate": 3.828483920367534e-06,
820
- "loss": 0.0435,
821
- "step": 1220
822
- },
823
- {
824
- "epoch": 9.26,
825
- "learning_rate": 3.445635528330781e-06,
826
- "loss": 0.0677,
827
- "step": 1230
828
- },
829
- {
830
- "epoch": 9.33,
831
- "learning_rate": 3.0627871362940276e-06,
832
- "loss": 0.0548,
833
- "step": 1240
834
- },
835
- {
836
- "epoch": 9.41,
837
- "learning_rate": 2.6799387442572743e-06,
838
- "loss": 0.0587,
839
- "step": 1250
840
- },
841
- {
842
- "epoch": 9.48,
843
- "learning_rate": 2.297090352220521e-06,
844
- "loss": 0.0382,
845
- "step": 1260
846
- },
847
- {
848
- "epoch": 9.56,
849
- "learning_rate": 1.914241960183767e-06,
850
- "loss": 0.0443,
851
- "step": 1270
852
- },
853
- {
854
- "epoch": 9.63,
855
- "learning_rate": 1.5313935681470138e-06,
856
- "loss": 0.0386,
857
- "step": 1280
858
- },
859
- {
860
- "epoch": 9.71,
861
- "learning_rate": 1.1485451761102605e-06,
862
- "loss": 0.0362,
863
- "step": 1290
864
- },
865
- {
866
- "epoch": 9.78,
867
- "learning_rate": 7.656967840735069e-07,
868
- "loss": 0.0478,
869
- "step": 1300
870
- },
871
- {
872
- "epoch": 9.86,
873
- "learning_rate": 3.8284839203675346e-07,
874
- "loss": 0.055,
875
- "step": 1310
876
- },
877
- {
878
- "epoch": 9.94,
879
- "learning_rate": 0.0,
880
- "loss": 0.0725,
881
- "step": 1320
882
- },
883
- {
884
- "epoch": 9.94,
885
- "eval_accuracy": 1.0,
886
- "eval_loss": 0.0010892293648794293,
887
- "eval_runtime": 22.2717,
888
- "eval_samples_per_second": 37.132,
889
- "eval_steps_per_second": 4.67,
890
- "step": 1320
891
  },
892
  {
893
- "epoch": 9.94,
894
- "step": 1320,
895
- "total_flos": 1.8367349154946929e+18,
896
- "train_loss": 0.10741477019407532,
897
- "train_runtime": 3799.865,
898
- "train_samples_per_second": 19.572,
899
- "train_steps_per_second": 0.347
900
  }
901
  ],
902
- "max_steps": 1320,
903
- "num_train_epochs": 10,
904
- "total_flos": 1.8367349154946929e+18,
905
  "trial_name": null,
906
  "trial_params": null
907
  }
 
1
  {
2
+ "best_metric": 0.9966480446927374,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-LongSleeveCleanedData/checkpoint-575",
4
+ "epoch": 4.97020854021847,
5
+ "global_step": 715,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.07,
12
+ "learning_rate": 4.985855728429986e-05,
13
+ "loss": 1.0641,
14
  "step": 10
15
  },
16
  {
17
+ "epoch": 0.14,
18
+ "learning_rate": 4.915134370579915e-05,
19
+ "loss": 0.7318,
20
  "step": 20
21
  },
22
  {
23
+ "epoch": 0.21,
24
+ "learning_rate": 4.844413012729845e-05,
25
+ "loss": 0.4442,
26
  "step": 30
27
  },
28
  {
29
+ "epoch": 0.28,
30
+ "learning_rate": 4.773691654879774e-05,
31
+ "loss": 0.38,
32
  "step": 40
33
  },
34
  {
35
+ "epoch": 0.35,
36
+ "learning_rate": 4.702970297029703e-05,
37
+ "loss": 0.2757,
38
  "step": 50
39
  },
40
  {
41
+ "epoch": 0.42,
42
+ "learning_rate": 4.632248939179633e-05,
43
+ "loss": 0.2418,
44
  "step": 60
45
  },
46
  {
47
+ "epoch": 0.49,
48
+ "learning_rate": 4.561527581329561e-05,
49
+ "loss": 0.2242,
50
  "step": 70
51
  },
52
  {
53
+ "epoch": 0.56,
54
+ "learning_rate": 4.490806223479491e-05,
55
+ "loss": 0.2094,
56
  "step": 80
57
  },
58
  {
59
+ "epoch": 0.63,
60
+ "learning_rate": 4.42008486562942e-05,
61
+ "loss": 0.2175,
62
  "step": 90
63
  },
64
  {
65
+ "epoch": 0.7,
66
+ "learning_rate": 4.3493635077793494e-05,
67
+ "loss": 0.1794,
68
  "step": 100
69
  },
70
  {
71
+ "epoch": 0.76,
72
+ "learning_rate": 4.278642149929279e-05,
73
+ "loss": 0.147,
74
  "step": 110
75
  },
76
  {
77
+ "epoch": 0.83,
78
+ "learning_rate": 4.207920792079208e-05,
79
+ "loss": 0.1538,
80
  "step": 120
81
  },
82
  {
83
+ "epoch": 0.9,
84
+ "learning_rate": 4.1371994342291374e-05,
85
+ "loss": 0.1365,
86
  "step": 130
87
  },
88
  {
89
+ "epoch": 0.97,
90
+ "learning_rate": 4.0664780763790665e-05,
91
+ "loss": 0.1802,
92
+ "step": 140
 
 
 
93
  },
94
  {
95
+ "epoch": 0.99,
96
+ "eval_accuracy": 0.9597765363128492,
97
+ "eval_loss": 0.1150519847869873,
98
+ "eval_runtime": 220.0966,
99
+ "eval_samples_per_second": 4.066,
100
+ "eval_steps_per_second": 0.509,
101
+ "step": 143
102
  },
103
  {
104
+ "epoch": 1.04,
105
+ "learning_rate": 3.9957567185289956e-05,
106
+ "loss": 0.1855,
107
  "step": 150
108
  },
109
  {
110
+ "epoch": 1.11,
111
+ "learning_rate": 3.9250353606789254e-05,
112
+ "loss": 0.1416,
113
  "step": 160
114
  },
115
  {
116
+ "epoch": 1.18,
117
+ "learning_rate": 3.8543140028288545e-05,
118
+ "loss": 0.1621,
119
  "step": 170
120
  },
121
  {
122
+ "epoch": 1.25,
123
+ "learning_rate": 3.783592644978784e-05,
124
+ "loss": 0.1769,
125
  "step": 180
126
  },
127
  {
128
+ "epoch": 1.32,
129
+ "learning_rate": 3.712871287128713e-05,
130
+ "loss": 0.1404,
131
  "step": 190
132
  },
133
  {
134
+ "epoch": 1.39,
135
+ "learning_rate": 3.642149929278642e-05,
136
+ "loss": 0.139,
137
  "step": 200
138
  },
139
  {
140
+ "epoch": 1.46,
141
+ "learning_rate": 3.571428571428572e-05,
142
+ "loss": 0.138,
143
  "step": 210
144
  },
145
  {
146
+ "epoch": 1.53,
147
+ "learning_rate": 3.500707213578501e-05,
148
+ "loss": 0.1705,
149
  "step": 220
150
  },
151
  {
152
+ "epoch": 1.6,
153
+ "learning_rate": 3.4299858557284306e-05,
154
+ "loss": 0.1272,
155
  "step": 230
156
  },
157
  {
158
+ "epoch": 1.67,
159
+ "learning_rate": 3.35926449787836e-05,
160
+ "loss": 0.1326,
161
  "step": 240
162
  },
163
  {
164
+ "epoch": 1.74,
165
+ "learning_rate": 3.288543140028288e-05,
166
+ "loss": 0.1268,
167
  "step": 250
168
  },
169
  {
170
+ "epoch": 1.81,
171
+ "learning_rate": 3.217821782178218e-05,
172
+ "loss": 0.1383,
173
  "step": 260
174
  },
175
  {
176
+ "epoch": 1.88,
177
+ "learning_rate": 3.147100424328147e-05,
178
+ "loss": 0.1043,
 
 
 
 
 
 
 
 
 
179
  "step": 270
180
  },
181
  {
182
+ "epoch": 1.95,
183
+ "learning_rate": 3.076379066478077e-05,
184
+ "loss": 0.0836,
185
  "step": 280
186
  },
187
  {
188
+ "epoch": 2.0,
189
+ "eval_accuracy": 0.994413407821229,
190
+ "eval_loss": 0.020183874294161797,
191
+ "eval_runtime": 22.3499,
192
+ "eval_samples_per_second": 40.045,
193
+ "eval_steps_per_second": 5.011,
194
+ "step": 287
195
+ },
196
+ {
197
+ "epoch": 2.02,
198
+ "learning_rate": 3.0056577086280057e-05,
199
+ "loss": 0.0581,
200
  "step": 290
201
  },
202
  {
203
+ "epoch": 2.09,
204
+ "learning_rate": 2.9349363507779348e-05,
205
+ "loss": 0.1456,
206
  "step": 300
207
  },
208
  {
209
+ "epoch": 2.15,
210
+ "learning_rate": 2.8642149929278646e-05,
211
+ "loss": 0.1157,
212
  "step": 310
213
  },
214
  {
215
+ "epoch": 2.22,
216
+ "learning_rate": 2.7934936350777934e-05,
217
+ "loss": 0.1005,
218
  "step": 320
219
  },
220
  {
221
+ "epoch": 2.29,
222
+ "learning_rate": 2.722772277227723e-05,
223
+ "loss": 0.0868,
224
  "step": 330
225
  },
226
  {
227
+ "epoch": 2.36,
228
+ "learning_rate": 2.6520509193776523e-05,
229
+ "loss": 0.1223,
230
  "step": 340
231
  },
232
  {
233
+ "epoch": 2.43,
234
+ "learning_rate": 2.581329561527581e-05,
235
+ "loss": 0.1164,
236
  "step": 350
237
  },
238
  {
239
+ "epoch": 2.5,
240
+ "learning_rate": 2.510608203677511e-05,
241
+ "loss": 0.081,
242
  "step": 360
243
  },
244
  {
245
+ "epoch": 2.57,
246
+ "learning_rate": 2.43988684582744e-05,
247
+ "loss": 0.076,
248
  "step": 370
249
  },
250
  {
251
+ "epoch": 2.64,
252
+ "learning_rate": 2.369165487977369e-05,
253
+ "loss": 0.0827,
254
  "step": 380
255
  },
256
  {
257
+ "epoch": 2.71,
258
+ "learning_rate": 2.2984441301272985e-05,
259
+ "loss": 0.0734,
260
  "step": 390
261
  },
262
  {
263
+ "epoch": 2.78,
264
+ "learning_rate": 2.227722772277228e-05,
265
+ "loss": 0.1122,
 
 
 
 
 
 
 
 
 
266
  "step": 400
267
  },
268
  {
269
+ "epoch": 2.85,
270
+ "learning_rate": 2.157001414427157e-05,
271
+ "loss": 0.1241,
272
  "step": 410
273
  },
274
  {
275
+ "epoch": 2.92,
276
+ "learning_rate": 2.0862800565770862e-05,
277
+ "loss": 0.1051,
278
  "step": 420
279
  },
280
  {
281
+ "epoch": 2.99,
282
+ "learning_rate": 2.0155586987270157e-05,
283
+ "loss": 0.1186,
284
  "step": 430
285
  },
286
  {
287
+ "epoch": 3.0,
288
+ "eval_accuracy": 0.994413407821229,
289
+ "eval_loss": 0.01652395911514759,
290
+ "eval_runtime": 23.7611,
291
+ "eval_samples_per_second": 37.667,
292
+ "eval_steps_per_second": 4.714,
293
+ "step": 431
294
+ },
295
+ {
296
+ "epoch": 3.06,
297
+ "learning_rate": 1.9448373408769448e-05,
298
+ "loss": 0.0954,
299
  "step": 440
300
  },
301
  {
302
+ "epoch": 3.13,
303
+ "learning_rate": 1.8741159830268743e-05,
304
+ "loss": 0.066,
305
  "step": 450
306
  },
307
  {
308
+ "epoch": 3.2,
309
+ "learning_rate": 1.8033946251768037e-05,
310
+ "loss": 0.1178,
311
  "step": 460
312
  },
313
  {
314
+ "epoch": 3.27,
315
+ "learning_rate": 1.7326732673267325e-05,
316
+ "loss": 0.091,
317
  "step": 470
318
  },
319
  {
320
+ "epoch": 3.34,
321
+ "learning_rate": 1.661951909476662e-05,
322
+ "loss": 0.0954,
323
  "step": 480
324
  },
325
  {
326
+ "epoch": 3.41,
327
+ "learning_rate": 1.5912305516265914e-05,
328
+ "loss": 0.0845,
329
  "step": 490
330
  },
331
  {
332
+ "epoch": 3.48,
333
+ "learning_rate": 1.5205091937765206e-05,
334
+ "loss": 0.0953,
335
  "step": 500
336
  },
337
  {
338
+ "epoch": 3.55,
339
+ "learning_rate": 1.44978783592645e-05,
340
+ "loss": 0.108,
341
  "step": 510
342
  },
343
  {
344
+ "epoch": 3.61,
345
+ "learning_rate": 1.379066478076379e-05,
346
+ "loss": 0.0578,
347
  "step": 520
348
  },
349
  {
350
+ "epoch": 3.68,
351
+ "learning_rate": 1.3083451202263084e-05,
352
+ "loss": 0.1044,
353
  "step": 530
354
  },
355
  {
356
+ "epoch": 3.75,
357
+ "learning_rate": 1.2376237623762377e-05,
358
+ "loss": 0.0842,
 
 
 
 
 
 
 
 
 
359
  "step": 540
360
  },
361
  {
362
+ "epoch": 3.82,
363
+ "learning_rate": 1.166902404526167e-05,
364
+ "loss": 0.0716,
365
  "step": 550
366
  },
367
  {
368
+ "epoch": 3.89,
369
+ "learning_rate": 1.0961810466760961e-05,
370
+ "loss": 0.0739,
371
  "step": 560
372
  },
373
  {
374
+ "epoch": 3.96,
375
+ "learning_rate": 1.0254596888260256e-05,
376
+ "loss": 0.08,
377
  "step": 570
378
  },
379
  {
380
+ "epoch": 4.0,
381
+ "eval_accuracy": 0.9966480446927374,
382
+ "eval_loss": 0.010998690500855446,
383
+ "eval_runtime": 23.7024,
384
+ "eval_samples_per_second": 37.76,
385
+ "eval_steps_per_second": 4.725,
386
+ "step": 575
387
+ },
388
+ {
389
+ "epoch": 4.03,
390
+ "learning_rate": 9.547383309759547e-06,
391
+ "loss": 0.0684,
392
  "step": 580
393
  },
394
  {
395
+ "epoch": 4.1,
396
+ "learning_rate": 8.84016973125884e-06,
397
+ "loss": 0.0694,
398
  "step": 590
399
  },
400
  {
401
+ "epoch": 4.17,
402
+ "learning_rate": 8.132956152758134e-06,
403
+ "loss": 0.0663,
404
  "step": 600
405
  },
406
  {
407
+ "epoch": 4.24,
408
+ "learning_rate": 7.4257425742574256e-06,
409
+ "loss": 0.0694,
410
  "step": 610
411
  },
412
  {
413
+ "epoch": 4.31,
414
+ "learning_rate": 6.718528995756719e-06,
415
+ "loss": 0.0776,
416
  "step": 620
417
  },
418
  {
419
+ "epoch": 4.38,
420
+ "learning_rate": 6.011315417256011e-06,
421
+ "loss": 0.0785,
422
  "step": 630
423
  },
424
  {
425
+ "epoch": 4.45,
426
+ "learning_rate": 5.304101838755304e-06,
427
+ "loss": 0.0773,
428
  "step": 640
429
  },
430
  {
431
+ "epoch": 4.52,
432
+ "learning_rate": 4.596888260254597e-06,
433
+ "loss": 0.06,
434
  "step": 650
435
  },
436
  {
437
+ "epoch": 4.59,
438
+ "learning_rate": 3.889674681753889e-06,
439
+ "loss": 0.0647,
440
  "step": 660
441
  },
442
  {
443
+ "epoch": 4.66,
444
+ "learning_rate": 3.182461103253183e-06,
445
+ "loss": 0.0821,
 
 
 
 
 
 
 
 
 
446
  "step": 670
447
  },
448
  {
449
+ "epoch": 4.73,
450
+ "learning_rate": 2.4752475247524753e-06,
451
+ "loss": 0.0589,
452
  "step": 680
453
  },
454
  {
455
+ "epoch": 4.8,
456
+ "learning_rate": 1.768033946251768e-06,
457
+ "loss": 0.0604,
458
  "step": 690
459
  },
460
  {
461
+ "epoch": 4.87,
462
+ "learning_rate": 1.0608203677510609e-06,
463
+ "loss": 0.0413,
464
  "step": 700
465
  },
466
  {
467
+ "epoch": 4.94,
468
+ "learning_rate": 3.536067892503536e-07,
469
+ "loss": 0.0575,
470
  "step": 710
471
  },
472
  {
473
+ "epoch": 4.97,
474
+ "eval_accuracy": 0.9955307262569832,
475
+ "eval_loss": 0.012482840567827225,
476
+ "eval_runtime": 24.0149,
477
+ "eval_samples_per_second": 37.269,
478
+ "eval_steps_per_second": 4.664,
479
+ "step": 715
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
480
  },
481
  {
482
+ "epoch": 4.97,
483
+ "step": 715,
484
+ "total_flos": 9.948639012864492e+17,
485
+ "train_loss": 0.1435624466075764,
486
+ "train_runtime": 3458.6134,
487
+ "train_samples_per_second": 11.641,
488
+ "train_steps_per_second": 0.207
489
  }
490
  ],
491
+ "max_steps": 715,
492
+ "num_train_epochs": 5,
493
+ "total_flos": 9.948639012864492e+17,
494
  "trial_name": null,
495
  "trial_params": null
496
  }