faridkarimli commited on
Commit
e7be466
1 Parent(s): cde26d8

End of training

Browse files
Files changed (6) hide show
  1. README.md +3 -1
  2. all_results.json +12 -0
  3. config.json +1 -0
  4. eval_results.json +8 -0
  5. train_results.json +7 -0
  6. trainer_state.json +424 -0
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: apache-2.0
3
  base_model: microsoft/swinv2-base-patch4-window12-192-22k
4
  tags:
 
 
5
  - generated_from_trainer
6
  metrics:
7
  - accuracy
@@ -17,8 +19,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/swinv2-base-patch4-window12-192-22k](https://huggingface.co/microsoft/swinv2-base-patch4-window12-192-22k) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Accuracy: 0.6785
21
  - Loss: 1.9857
 
22
 
23
  ## Model description
24
 
 
2
  license: apache-2.0
3
  base_model: microsoft/swinv2-base-patch4-window12-192-22k
4
  tags:
5
+ - image-classification
6
+ - vision
7
  - generated_from_trainer
8
  metrics:
9
  - accuracy
 
19
 
20
  This model is a fine-tuned version of [microsoft/swinv2-base-patch4-window12-192-22k](https://huggingface.co/microsoft/swinv2-base-patch4-window12-192-22k) on an unknown dataset.
21
  It achieves the following results on the evaluation set:
 
22
  - Loss: 1.9857
23
+ - Accuracy: 0.6785
24
 
25
  ## Model description
26
 
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 16.0,
3
+ "eval_accuracy": 0.6784972165163288,
4
+ "eval_loss": 1.9857261180877686,
5
+ "eval_runtime": 4657.9109,
6
+ "eval_samples_per_second": 36.058,
7
+ "eval_steps_per_second": 0.071,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 372.6046,
10
+ "train_samples_per_second": 27045.44,
11
+ "train_steps_per_second": 52.858
12
+ }
config.json CHANGED
@@ -31044,6 +31044,7 @@
31044
  0,
31045
  0
31046
  ],
 
31047
  "qkv_bias": true,
31048
  "torch_dtype": "float32",
31049
  "transformers_version": "4.33.3",
 
31044
  0,
31045
  0
31046
  ],
31047
+ "problem_type": "single_label_classification",
31048
  "qkv_bias": true,
31049
  "torch_dtype": "float32",
31050
  "transformers_version": "4.33.3",
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 16.0,
3
+ "eval_accuracy": 0.6784972165163288,
4
+ "eval_loss": 1.9857261180877686,
5
+ "eval_runtime": 4657.9109,
6
+ "eval_samples_per_second": 36.058,
7
+ "eval_steps_per_second": 0.071
8
+ }
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 16.0,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 372.6046,
5
+ "train_samples_per_second": 27045.44,
6
+ "train_steps_per_second": 52.858
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,424 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 16.0,
5
+ "eval_steps": 500,
6
+ "global_step": 21008,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.38,
13
+ "learning_rate": 0.0009873064229499874,
14
+ "loss": 2.3443,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.76,
19
+ "learning_rate": 0.0009746128458999747,
20
+ "loss": 1.6863,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 1.0,
25
+ "eval_accuracy": 0.575725640796642,
26
+ "eval_loss": 1.955936312675476,
27
+ "eval_runtime": 2249.8295,
28
+ "eval_samples_per_second": 74.652,
29
+ "eval_steps_per_second": 0.146,
30
+ "step": 1313
31
+ },
32
+ {
33
+ "epoch": 1.14,
34
+ "learning_rate": 0.0009619192688499619,
35
+ "loss": 1.4821,
36
+ "step": 1500
37
+ },
38
+ {
39
+ "epoch": 1.52,
40
+ "learning_rate": 0.0009492256917999492,
41
+ "loss": 1.3492,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.9,
46
+ "learning_rate": 0.0009365321147499366,
47
+ "loss": 1.3275,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 2.0,
52
+ "eval_accuracy": 0.606090917209967,
53
+ "eval_loss": 1.8276444673538208,
54
+ "eval_runtime": 1553.5911,
55
+ "eval_samples_per_second": 108.108,
56
+ "eval_steps_per_second": 0.212,
57
+ "step": 2626
58
+ },
59
+ {
60
+ "epoch": 2.28,
61
+ "learning_rate": 0.0009238385376999238,
62
+ "loss": 1.1767,
63
+ "step": 3000
64
+ },
65
+ {
66
+ "epoch": 2.67,
67
+ "learning_rate": 0.0009111449606499112,
68
+ "loss": 1.151,
69
+ "step": 3500
70
+ },
71
+ {
72
+ "epoch": 3.0,
73
+ "eval_accuracy": 0.6130332529546605,
74
+ "eval_loss": 1.885665774345398,
75
+ "eval_runtime": 1611.9735,
76
+ "eval_samples_per_second": 104.192,
77
+ "eval_steps_per_second": 0.204,
78
+ "step": 3939
79
+ },
80
+ {
81
+ "epoch": 3.05,
82
+ "learning_rate": 0.0008984513835998985,
83
+ "loss": 1.1393,
84
+ "step": 4000
85
+ },
86
+ {
87
+ "epoch": 3.43,
88
+ "learning_rate": 0.0008857578065498858,
89
+ "loss": 1.0116,
90
+ "step": 4500
91
+ },
92
+ {
93
+ "epoch": 3.81,
94
+ "learning_rate": 0.0008730642294998731,
95
+ "loss": 1.0336,
96
+ "step": 5000
97
+ },
98
+ {
99
+ "epoch": 4.0,
100
+ "eval_accuracy": 0.6322288708284958,
101
+ "eval_loss": 1.8160221576690674,
102
+ "eval_runtime": 1568.2238,
103
+ "eval_samples_per_second": 107.099,
104
+ "eval_steps_per_second": 0.21,
105
+ "step": 5252
106
+ },
107
+ {
108
+ "epoch": 4.19,
109
+ "learning_rate": 0.0008603706524498604,
110
+ "loss": 0.9722,
111
+ "step": 5500
112
+ },
113
+ {
114
+ "epoch": 4.57,
115
+ "learning_rate": 0.0008476770753998477,
116
+ "loss": 0.9309,
117
+ "step": 6000
118
+ },
119
+ {
120
+ "epoch": 4.95,
121
+ "learning_rate": 0.000834983498349835,
122
+ "loss": 0.947,
123
+ "step": 6500
124
+ },
125
+ {
126
+ "epoch": 5.0,
127
+ "eval_accuracy": 0.6317465987913429,
128
+ "eval_loss": 1.8050605058670044,
129
+ "eval_runtime": 1542.405,
130
+ "eval_samples_per_second": 108.892,
131
+ "eval_steps_per_second": 0.213,
132
+ "step": 6565
133
+ },
134
+ {
135
+ "epoch": 5.33,
136
+ "learning_rate": 0.0008222899212998223,
137
+ "loss": 0.8427,
138
+ "step": 7000
139
+ },
140
+ {
141
+ "epoch": 5.71,
142
+ "learning_rate": 0.0008095963442498096,
143
+ "loss": 0.8595,
144
+ "step": 7500
145
+ },
146
+ {
147
+ "epoch": 6.0,
148
+ "eval_accuracy": 0.6442737638057813,
149
+ "eval_loss": 1.7996306419372559,
150
+ "eval_runtime": 1561.8382,
151
+ "eval_samples_per_second": 107.537,
152
+ "eval_steps_per_second": 0.211,
153
+ "step": 7878
154
+ },
155
+ {
156
+ "epoch": 6.09,
157
+ "learning_rate": 0.0007969027671997969,
158
+ "loss": 0.8393,
159
+ "step": 8000
160
+ },
161
+ {
162
+ "epoch": 6.47,
163
+ "learning_rate": 0.0007842091901497842,
164
+ "loss": 0.7719,
165
+ "step": 8500
166
+ },
167
+ {
168
+ "epoch": 6.85,
169
+ "learning_rate": 0.0007715156130997715,
170
+ "loss": 0.801,
171
+ "step": 9000
172
+ },
173
+ {
174
+ "epoch": 7.0,
175
+ "eval_accuracy": 0.6533952546813134,
176
+ "eval_loss": 1.7987133264541626,
177
+ "eval_runtime": 1549.5067,
178
+ "eval_samples_per_second": 108.393,
179
+ "eval_steps_per_second": 0.212,
180
+ "step": 9191
181
+ },
182
+ {
183
+ "epoch": 7.24,
184
+ "learning_rate": 0.0007588220360497588,
185
+ "loss": 0.7443,
186
+ "step": 9500
187
+ },
188
+ {
189
+ "epoch": 7.62,
190
+ "learning_rate": 0.0007461284589997462,
191
+ "loss": 0.7296,
192
+ "step": 10000
193
+ },
194
+ {
195
+ "epoch": 8.0,
196
+ "learning_rate": 0.0007334348819497334,
197
+ "loss": 0.7508,
198
+ "step": 10500
199
+ },
200
+ {
201
+ "epoch": 8.0,
202
+ "eval_accuracy": 0.6521925515763151,
203
+ "eval_loss": 1.7864270210266113,
204
+ "eval_runtime": 1567.4501,
205
+ "eval_samples_per_second": 107.152,
206
+ "eval_steps_per_second": 0.21,
207
+ "step": 10504
208
+ },
209
+ {
210
+ "epoch": 8.38,
211
+ "learning_rate": 0.0007207413048997208,
212
+ "loss": 0.6659,
213
+ "step": 11000
214
+ },
215
+ {
216
+ "epoch": 8.76,
217
+ "learning_rate": 0.0007080477278497081,
218
+ "loss": 0.694,
219
+ "step": 11500
220
+ },
221
+ {
222
+ "epoch": 9.0,
223
+ "eval_accuracy": 0.6525795600011908,
224
+ "eval_loss": 1.8871492147445679,
225
+ "eval_runtime": 1630.371,
226
+ "eval_samples_per_second": 103.016,
227
+ "eval_steps_per_second": 0.202,
228
+ "step": 11817
229
+ },
230
+ {
231
+ "epoch": 9.14,
232
+ "learning_rate": 0.0006953541507996953,
233
+ "loss": 0.6611,
234
+ "step": 12000
235
+ },
236
+ {
237
+ "epoch": 9.52,
238
+ "learning_rate": 0.0006826605737496827,
239
+ "loss": 0.6326,
240
+ "step": 12500
241
+ },
242
+ {
243
+ "epoch": 9.9,
244
+ "learning_rate": 0.00066996699669967,
245
+ "loss": 0.6523,
246
+ "step": 13000
247
+ },
248
+ {
249
+ "epoch": 10.0,
250
+ "eval_accuracy": 0.6648149802030305,
251
+ "eval_loss": 1.805672287940979,
252
+ "eval_runtime": 1557.784,
253
+ "eval_samples_per_second": 107.817,
254
+ "eval_steps_per_second": 0.211,
255
+ "step": 13130
256
+ },
257
+ {
258
+ "epoch": 10.28,
259
+ "learning_rate": 0.0006572734196496572,
260
+ "loss": 0.602,
261
+ "step": 13500
262
+ },
263
+ {
264
+ "epoch": 10.66,
265
+ "learning_rate": 0.0006445798425996446,
266
+ "loss": 0.5976,
267
+ "step": 14000
268
+ },
269
+ {
270
+ "epoch": 11.0,
271
+ "eval_accuracy": 0.6706736923580721,
272
+ "eval_loss": 1.8513981103897095,
273
+ "eval_runtime": 1548.9015,
274
+ "eval_samples_per_second": 108.435,
275
+ "eval_steps_per_second": 0.212,
276
+ "step": 14443
277
+ },
278
+ {
279
+ "epoch": 11.04,
280
+ "learning_rate": 0.0006318862655496319,
281
+ "loss": 0.6049,
282
+ "step": 14500
283
+ },
284
+ {
285
+ "epoch": 11.42,
286
+ "learning_rate": 0.0006191926884996192,
287
+ "loss": 0.5476,
288
+ "step": 15000
289
+ },
290
+ {
291
+ "epoch": 11.81,
292
+ "learning_rate": 0.0006064991114496065,
293
+ "loss": 0.5743,
294
+ "step": 15500
295
+ },
296
+ {
297
+ "epoch": 12.0,
298
+ "eval_accuracy": 0.6628501681998155,
299
+ "eval_loss": 1.927115559577942,
300
+ "eval_runtime": 1525.7141,
301
+ "eval_samples_per_second": 110.083,
302
+ "eval_steps_per_second": 0.216,
303
+ "step": 15756
304
+ },
305
+ {
306
+ "epoch": 12.19,
307
+ "learning_rate": 0.0005938055343995938,
308
+ "loss": 0.5441,
309
+ "step": 16000
310
+ },
311
+ {
312
+ "epoch": 12.57,
313
+ "learning_rate": 0.0005811119573495812,
314
+ "loss": 0.5232,
315
+ "step": 16500
316
+ },
317
+ {
318
+ "epoch": 12.95,
319
+ "learning_rate": 0.0005684183802995684,
320
+ "loss": 0.5426,
321
+ "step": 17000
322
+ },
323
+ {
324
+ "epoch": 13.0,
325
+ "eval_accuracy": 0.6691911523920098,
326
+ "eval_loss": 1.9220695495605469,
327
+ "eval_runtime": 1530.5139,
328
+ "eval_samples_per_second": 109.738,
329
+ "eval_steps_per_second": 0.215,
330
+ "step": 17069
331
+ },
332
+ {
333
+ "epoch": 13.33,
334
+ "learning_rate": 0.0005557248032495558,
335
+ "loss": 0.5004,
336
+ "step": 17500
337
+ },
338
+ {
339
+ "epoch": 13.71,
340
+ "learning_rate": 0.0005430312261995431,
341
+ "loss": 0.5092,
342
+ "step": 18000
343
+ },
344
+ {
345
+ "epoch": 14.0,
346
+ "eval_accuracy": 0.6751987139412342,
347
+ "eval_loss": 1.9163544178009033,
348
+ "eval_runtime": 1663.4966,
349
+ "eval_samples_per_second": 100.965,
350
+ "eval_steps_per_second": 0.198,
351
+ "step": 18382
352
+ },
353
+ {
354
+ "epoch": 14.09,
355
+ "learning_rate": 0.0005303376491495303,
356
+ "loss": 0.5017,
357
+ "step": 18500
358
+ },
359
+ {
360
+ "epoch": 14.47,
361
+ "learning_rate": 0.0005176440720995177,
362
+ "loss": 0.4729,
363
+ "step": 19000
364
+ },
365
+ {
366
+ "epoch": 14.85,
367
+ "learning_rate": 0.000504950495049505,
368
+ "loss": 0.4808,
369
+ "step": 19500
370
+ },
371
+ {
372
+ "epoch": 15.0,
373
+ "eval_accuracy": 0.6743115715519038,
374
+ "eval_loss": 1.925864815711975,
375
+ "eval_runtime": 1533.1814,
376
+ "eval_samples_per_second": 109.547,
377
+ "eval_steps_per_second": 0.215,
378
+ "step": 19695
379
+ },
380
+ {
381
+ "epoch": 15.23,
382
+ "learning_rate": 0.0004922569179994923,
383
+ "loss": 0.4595,
384
+ "step": 20000
385
+ },
386
+ {
387
+ "epoch": 15.61,
388
+ "learning_rate": 0.00047956334094947955,
389
+ "loss": 0.4489,
390
+ "step": 20500
391
+ },
392
+ {
393
+ "epoch": 15.99,
394
+ "learning_rate": 0.00046686976389946687,
395
+ "loss": 0.4611,
396
+ "step": 21000
397
+ },
398
+ {
399
+ "epoch": 16.0,
400
+ "eval_accuracy": 0.6784972165163288,
401
+ "eval_loss": 1.9857261180877686,
402
+ "eval_runtime": 1537.6389,
403
+ "eval_samples_per_second": 109.229,
404
+ "eval_steps_per_second": 0.214,
405
+ "step": 21008
406
+ },
407
+ {
408
+ "epoch": 16.0,
409
+ "step": 21008,
410
+ "total_flos": 7.331020593786202e+20,
411
+ "train_loss": 0.0,
412
+ "train_runtime": 372.6046,
413
+ "train_samples_per_second": 27045.44,
414
+ "train_steps_per_second": 52.858
415
+ }
416
+ ],
417
+ "logging_steps": 500,
418
+ "max_steps": 19695,
419
+ "num_train_epochs": 15,
420
+ "save_steps": 500,
421
+ "total_flos": 7.331020593786202e+20,
422
+ "trial_name": null,
423
+ "trial_params": null
424
+ }