oschamp committed on
Commit
bc0d2d6
1 Parent(s): 1f438f9

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 8.0,
3
- "eval_accuracy": 0.4887640449438202,
4
- "eval_loss": 1.3362700939178467,
5
- "eval_runtime": 1.464,
6
- "eval_samples_per_second": 121.585,
7
- "eval_steps_per_second": 15.71,
8
- "train_loss": 0.6919720236744199,
9
- "train_runtime": 221.2781,
10
- "train_samples_per_second": 64.1,
11
- "train_steps_per_second": 2.025
12
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "eval_accuracy": 0.5947786606129398,
4
+ "eval_loss": 1.1392158269882202,
5
+ "eval_runtime": 7.247,
6
+ "eval_samples_per_second": 121.567,
7
+ "eval_steps_per_second": 15.317,
8
+ "train_loss": 0.7775138853479633,
9
+ "train_runtime": 613.7183,
10
+ "train_samples_per_second": 57.909,
11
+ "train_steps_per_second": 1.812
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 8.0,
3
- "eval_accuracy": 0.4887640449438202,
4
- "eval_loss": 1.3362700939178467,
5
- "eval_runtime": 1.464,
6
- "eval_samples_per_second": 121.585,
7
- "eval_steps_per_second": 15.71
8
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "eval_accuracy": 0.5947786606129398,
4
+ "eval_loss": 1.1392158269882202,
5
+ "eval_runtime": 7.247,
6
+ "eval_samples_per_second": 121.567,
7
+ "eval_steps_per_second": 15.317
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c9d9ca1c7cc02ffd2ae4d152309d2ae52a11c26cd61cdc65043c0fd840af521
3
  size 343290221
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa4b52595c9f1ae8aabee148abbf8e0e816620c266821f687930ff4b31bded53
3
  size 343290221
runs/Feb22_09-09-32_OSchamp-PC/1677053372.6353683/events.out.tfevents.1677053372.OSchamp-PC.24028.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bac4d583c736b4b44b116d1325a6a9f16c4a021756cd753fffc6131dfbacb1d
3
+ size 5741
runs/Feb22_09-09-32_OSchamp-PC/events.out.tfevents.1677053372.OSchamp-PC.24028.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:802d4fb16ee0ca0e226182fae64cd493cd756ce79c064419b75bb2c0b331bdea
3
+ size 21421
runs/Feb22_09-36-47_OSchamp-PC/1677055007.7834058/events.out.tfevents.1677055007.OSchamp-PC.4212.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc4151a23bc749a3da9eaf790d7dd5ab441c2cfe9a6280b6c0243f4991e1b3c
3
+ size 5741
runs/Feb22_09-36-47_OSchamp-PC/events.out.tfevents.1677055007.OSchamp-PC.4212.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ac4c513f66cbab58a313d3ca52caa59cf247b42b5e88cd86da756356c65f30
3
+ size 11582
runs/Feb22_09-36-47_OSchamp-PC/events.out.tfevents.1677055629.OSchamp-PC.4212.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d5ab12ef82b4889b74b0982e21f33851fad8edda6aa0480726542c888b0971f
3
+ size 411
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 8.0,
3
- "train_loss": 0.6919720236744199,
4
- "train_runtime": 221.2781,
5
- "train_samples_per_second": 64.1,
6
- "train_steps_per_second": 2.025
7
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "train_loss": 0.7775138853479633,
4
+ "train_runtime": 613.7183,
5
+ "train_samples_per_second": 57.909,
6
+ "train_steps_per_second": 1.812
7
  }
trainer_state.json CHANGED
@@ -1,109 +1,256 @@
1
  {
2
- "best_metric": 1.3362700939178467,
3
- "best_model_checkpoint": "./vit-artworkclassifier\\checkpoint-200",
4
- "epoch": 8.0,
5
- "global_step": 448,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.89,
12
- "learning_rate": 8.883928571428571e-05,
13
- "loss": 1.9187,
14
  "step": 50
15
  },
16
  {
17
- "epoch": 1.79,
18
- "learning_rate": 7.767857142857144e-05,
19
- "loss": 1.4136,
20
  "step": 100
21
  },
22
  {
23
- "epoch": 1.79,
24
- "eval_accuracy": 0.5112359550561798,
25
- "eval_loss": 1.5092945098876953,
26
- "eval_runtime": 1.5015,
27
- "eval_samples_per_second": 118.548,
28
- "eval_steps_per_second": 15.318,
29
  "step": 100
30
  },
31
  {
32
- "epoch": 2.68,
33
- "learning_rate": 6.651785714285714e-05,
34
- "loss": 1.0465,
35
  "step": 150
36
  },
37
  {
38
- "epoch": 3.57,
39
- "learning_rate": 5.535714285714286e-05,
40
- "loss": 0.7189,
41
  "step": 200
42
  },
43
  {
44
- "epoch": 3.57,
45
- "eval_accuracy": 0.4887640449438202,
46
- "eval_loss": 1.3362700939178467,
47
- "eval_runtime": 1.475,
48
- "eval_samples_per_second": 120.678,
49
- "eval_steps_per_second": 15.593,
50
  "step": 200
51
  },
52
  {
53
- "epoch": 4.46,
54
- "learning_rate": 4.419642857142857e-05,
55
- "loss": 0.4243,
56
  "step": 250
57
  },
58
  {
59
- "epoch": 5.36,
60
- "learning_rate": 3.303571428571429e-05,
61
- "loss": 0.2717,
62
  "step": 300
63
  },
64
  {
65
- "epoch": 5.36,
66
- "eval_accuracy": 0.5280898876404494,
67
- "eval_loss": 1.490658164024353,
68
- "eval_runtime": 1.4785,
69
- "eval_samples_per_second": 120.393,
70
- "eval_steps_per_second": 15.556,
71
  "step": 300
72
  },
73
  {
74
- "epoch": 6.25,
75
- "learning_rate": 2.1875e-05,
76
- "loss": 0.184,
77
  "step": 350
78
  },
79
  {
80
- "epoch": 7.14,
81
- "learning_rate": 1.0714285714285714e-05,
82
- "loss": 0.1227,
83
  "step": 400
84
  },
85
  {
86
- "epoch": 7.14,
87
- "eval_accuracy": 0.5561797752808989,
88
- "eval_loss": 1.4826292991638184,
89
- "eval_runtime": 1.463,
90
- "eval_samples_per_second": 121.668,
91
- "eval_steps_per_second": 15.721,
92
  "step": 400
93
  },
94
  {
95
- "epoch": 8.0,
96
- "step": 448,
97
- "total_flos": 1.0992153398028042e+18,
98
- "train_loss": 0.6919720236744199,
99
- "train_runtime": 221.2781,
100
- "train_samples_per_second": 64.1,
101
- "train_steps_per_second": 2.025
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
102
  }
103
  ],
104
- "max_steps": 448,
105
- "num_train_epochs": 8,
106
- "total_flos": 1.0992153398028042e+18,
107
  "trial_name": null,
108
  "trial_params": null
109
  }
 
1
  {
2
+ "best_metric": 1.1392158269882202,
3
+ "best_model_checkpoint": "./vit-artworkclassifier\\checkpoint-600",
4
+ "epoch": 4.0,
5
+ "global_step": 1112,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.18,
12
+ "learning_rate": 9.550359712230216e-05,
13
+ "loss": 1.9425,
14
  "step": 50
15
  },
16
  {
17
+ "epoch": 0.36,
18
+ "learning_rate": 9.100719424460432e-05,
19
+ "loss": 1.5906,
20
  "step": 100
21
  },
22
  {
23
+ "epoch": 0.36,
24
+ "eval_accuracy": 0.48467650397275824,
25
+ "eval_loss": 1.4708987474441528,
26
+ "eval_runtime": 7.3715,
27
+ "eval_samples_per_second": 119.514,
28
+ "eval_steps_per_second": 15.058,
29
  "step": 100
30
  },
31
  {
32
+ "epoch": 0.54,
33
+ "learning_rate": 8.651079136690648e-05,
34
+ "loss": 1.4388,
35
  "step": 150
36
  },
37
  {
38
+ "epoch": 0.72,
39
+ "learning_rate": 8.201438848920863e-05,
40
+ "loss": 1.3395,
41
  "step": 200
42
  },
43
  {
44
+ "epoch": 0.72,
45
+ "eval_accuracy": 0.5073779795686719,
46
+ "eval_loss": 1.3207731246948242,
47
+ "eval_runtime": 7.4035,
48
+ "eval_samples_per_second": 118.998,
49
+ "eval_steps_per_second": 14.993,
50
  "step": 200
51
  },
52
  {
53
+ "epoch": 0.9,
54
+ "learning_rate": 7.751798561151079e-05,
55
+ "loss": 1.3275,
56
  "step": 250
57
  },
58
  {
59
+ "epoch": 1.08,
60
+ "learning_rate": 7.302158273381295e-05,
61
+ "loss": 1.1461,
62
  "step": 300
63
  },
64
  {
65
+ "epoch": 1.08,
66
+ "eval_accuracy": 0.5164585698070374,
67
+ "eval_loss": 1.3362975120544434,
68
+ "eval_runtime": 7.64,
69
+ "eval_samples_per_second": 115.314,
70
+ "eval_steps_per_second": 14.529,
71
  "step": 300
72
  },
73
  {
74
+ "epoch": 1.26,
75
+ "learning_rate": 6.852517985611511e-05,
76
+ "loss": 0.9749,
77
  "step": 350
78
  },
79
  {
80
+ "epoch": 1.44,
81
+ "learning_rate": 6.402877697841726e-05,
82
+ "loss": 0.9593,
83
  "step": 400
84
  },
85
  {
86
+ "epoch": 1.44,
87
+ "eval_accuracy": 0.5845629965947786,
88
+ "eval_loss": 1.1789547204971313,
89
+ "eval_runtime": 7.248,
90
+ "eval_samples_per_second": 121.551,
91
+ "eval_steps_per_second": 15.315,
92
  "step": 400
93
  },
94
  {
95
+ "epoch": 1.62,
96
+ "learning_rate": 5.953237410071942e-05,
97
+ "loss": 0.9175,
98
+ "step": 450
99
+ },
100
+ {
101
+ "epoch": 1.8,
102
+ "learning_rate": 5.512589928057554e-05,
103
+ "loss": 0.8761,
104
+ "step": 500
105
+ },
106
+ {
107
+ "epoch": 1.8,
108
+ "eval_accuracy": 0.5902383654937571,
109
+ "eval_loss": 1.1252126693725586,
110
+ "eval_runtime": 7.2535,
111
+ "eval_samples_per_second": 121.459,
112
+ "eval_steps_per_second": 15.303,
113
+ "step": 500
114
+ },
115
+ {
116
+ "epoch": 1.98,
117
+ "learning_rate": 5.06294964028777e-05,
118
+ "loss": 0.8615,
119
+ "step": 550
120
+ },
121
+ {
122
+ "epoch": 2.16,
123
+ "learning_rate": 4.613309352517986e-05,
124
+ "loss": 0.5922,
125
+ "step": 600
126
+ },
127
+ {
128
+ "epoch": 2.16,
129
+ "eval_accuracy": 0.5947786606129398,
130
+ "eval_loss": 1.1392158269882202,
131
+ "eval_runtime": 7.5695,
132
+ "eval_samples_per_second": 116.388,
133
+ "eval_steps_per_second": 14.664,
134
+ "step": 600
135
+ },
136
+ {
137
+ "epoch": 2.34,
138
+ "learning_rate": 4.163669064748202e-05,
139
+ "loss": 0.4684,
140
+ "step": 650
141
+ },
142
+ {
143
+ "epoch": 2.52,
144
+ "learning_rate": 3.714028776978418e-05,
145
+ "loss": 0.4803,
146
+ "step": 700
147
+ },
148
+ {
149
+ "epoch": 2.52,
150
+ "eval_accuracy": 0.5936435868331441,
151
+ "eval_loss": 1.1560313701629639,
152
+ "eval_runtime": 7.3175,
153
+ "eval_samples_per_second": 120.396,
154
+ "eval_steps_per_second": 15.169,
155
+ "step": 700
156
+ },
157
+ {
158
+ "epoch": 2.7,
159
+ "learning_rate": 3.2643884892086335e-05,
160
+ "loss": 0.4766,
161
+ "step": 750
162
+ },
163
+ {
164
+ "epoch": 2.88,
165
+ "learning_rate": 2.8147482014388493e-05,
166
+ "loss": 0.4454,
167
+ "step": 800
168
+ },
169
+ {
170
+ "epoch": 2.88,
171
+ "eval_accuracy": 0.6118047673098751,
172
+ "eval_loss": 1.1545273065567017,
173
+ "eval_runtime": 7.2475,
174
+ "eval_samples_per_second": 121.559,
175
+ "eval_steps_per_second": 15.316,
176
+ "step": 800
177
+ },
178
+ {
179
+ "epoch": 3.06,
180
+ "learning_rate": 2.3651079136690647e-05,
181
+ "loss": 0.371,
182
+ "step": 850
183
+ },
184
+ {
185
+ "epoch": 3.24,
186
+ "learning_rate": 1.9154676258992808e-05,
187
+ "loss": 0.2271,
188
+ "step": 900
189
+ },
190
+ {
191
+ "epoch": 3.24,
192
+ "eval_accuracy": 0.6038592508513053,
193
+ "eval_loss": 1.2283731698989868,
194
+ "eval_runtime": 7.1705,
195
+ "eval_samples_per_second": 122.865,
196
+ "eval_steps_per_second": 15.48,
197
+ "step": 900
198
+ },
199
+ {
200
+ "epoch": 3.42,
201
+ "learning_rate": 1.4658273381294965e-05,
202
+ "loss": 0.2249,
203
+ "step": 950
204
+ },
205
+ {
206
+ "epoch": 3.6,
207
+ "learning_rate": 1.0161870503597123e-05,
208
+ "loss": 0.207,
209
+ "step": 1000
210
+ },
211
+ {
212
+ "epoch": 3.6,
213
+ "eval_accuracy": 0.5959137343927355,
214
+ "eval_loss": 1.262502670288086,
215
+ "eval_runtime": 7.2385,
216
+ "eval_samples_per_second": 121.71,
217
+ "eval_steps_per_second": 15.335,
218
+ "step": 1000
219
+ },
220
+ {
221
+ "epoch": 3.78,
222
+ "learning_rate": 5.665467625899281e-06,
223
+ "loss": 0.1906,
224
+ "step": 1050
225
+ },
226
+ {
227
+ "epoch": 3.96,
228
+ "learning_rate": 1.169064748201439e-06,
229
+ "loss": 0.1958,
230
+ "step": 1100
231
+ },
232
+ {
233
+ "epoch": 3.96,
234
+ "eval_accuracy": 0.6004540295119183,
235
+ "eval_loss": 1.262100338935852,
236
+ "eval_runtime": 7.2855,
237
+ "eval_samples_per_second": 120.925,
238
+ "eval_steps_per_second": 15.236,
239
+ "step": 1100
240
+ },
241
+ {
242
+ "epoch": 4.0,
243
+ "step": 1112,
244
+ "total_flos": 2.7542380976164454e+18,
245
+ "train_loss": 0.7775138853479633,
246
+ "train_runtime": 613.7183,
247
+ "train_samples_per_second": 57.909,
248
+ "train_steps_per_second": 1.812
249
  }
250
  ],
251
+ "max_steps": 1112,
252
+ "num_train_epochs": 4,
253
+ "total_flos": 2.7542380976164454e+18,
254
  "trial_name": null,
255
  "trial_params": null
256
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2f0782b18499c0eb146fd57158a7f97d1753735fa78d6d0dda80002fd01c1f7
3
  size 3515
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22cade885a8be87eda98e5a3fbbf428f0503894f9d241765ed5d6ba07d42d657
3
  size 3515