pierreguillou commited on
Commit
f3e3bd7
β€’
1 Parent(s): 91b6951

End of training

Browse files
checkpoint-11000/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c57e05d3f7e9c882e3cf561394a94532ce7d4df59b422bf335fad1498c1cc3e
3
- size 1134425553
 
 
 
 
checkpoint-11000/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:edc6c1a25455a0ac08a6ba15e2bb0949f0e47c53b5d7e9f6781b4d75bdb78a0d
3
- size 14575
 
 
 
 
checkpoint-11000/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1cf22c2871c42a245e6e913d024763352b9f1be40e2deb2b845f641c7d0252c
3
- size 557
 
 
 
 
checkpoint-11000/trainer_state.json DELETED
@@ -1,412 +0,0 @@
1
- {
2
- "best_metric": 0.8849383152916955,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
- "epoch": 4.570004154549231,
5
- "global_step": 11000,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.21,
12
- "learning_rate": 4.793934358122144e-05,
13
- "loss": 0.7223,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 0.21,
18
- "eval_accuracy": 0.7741471103890881,
19
- "eval_f1": 0.7741471103890881,
20
- "eval_loss": 0.7764509916305542,
21
- "eval_precision": 0.7741471103890881,
22
- "eval_recall": 0.7741471103890881,
23
- "eval_runtime": 33.2902,
24
- "eval_samples_per_second": 61.64,
25
- "eval_steps_per_second": 3.875,
26
- "step": 500
27
- },
28
- {
29
- "epoch": 0.42,
30
- "learning_rate": 4.5870378063980065e-05,
31
- "loss": 0.4469,
32
- "step": 1000
33
- },
34
- {
35
- "epoch": 0.42,
36
- "eval_accuracy": 0.8311511798105226,
37
- "eval_f1": 0.8311511798105226,
38
- "eval_loss": 0.5913723707199097,
39
- "eval_precision": 0.8311511798105226,
40
- "eval_recall": 0.8311511798105226,
41
- "eval_runtime": 37.4699,
42
- "eval_samples_per_second": 54.764,
43
- "eval_steps_per_second": 3.443,
44
- "step": 1000
45
- },
46
- {
47
- "epoch": 0.62,
48
- "learning_rate": 4.3793103448275864e-05,
49
- "loss": 0.3819,
50
- "step": 1500
51
- },
52
- {
53
- "epoch": 0.62,
54
- "eval_accuracy": 0.8102330668639719,
55
- "eval_f1": 0.8102330668639719,
56
- "eval_loss": 0.8744572997093201,
57
- "eval_precision": 0.8102330668639719,
58
- "eval_recall": 0.8102330668639719,
59
- "eval_runtime": 34.6123,
60
- "eval_samples_per_second": 59.285,
61
- "eval_steps_per_second": 3.727,
62
- "step": 1500
63
- },
64
- {
65
- "epoch": 0.83,
66
- "learning_rate": 4.171582883257167e-05,
67
- "loss": 0.3361,
68
- "step": 2000
69
- },
70
- {
71
- "epoch": 0.83,
72
- "eval_accuracy": 0.8337166846278812,
73
- "eval_f1": 0.8337166846278812,
74
- "eval_loss": 0.6990912556648254,
75
- "eval_precision": 0.8337166846278812,
76
- "eval_recall": 0.8337166846278812,
77
- "eval_runtime": 38.6559,
78
- "eval_samples_per_second": 53.084,
79
- "eval_steps_per_second": 3.337,
80
- "step": 2000
81
- },
82
- {
83
- "epoch": 1.04,
84
- "learning_rate": 3.964270876609888e-05,
85
- "loss": 0.2784,
86
- "step": 2500
87
- },
88
- {
89
- "epoch": 1.04,
90
- "eval_accuracy": 0.8119380418523106,
91
- "eval_f1": 0.8119380418523107,
92
- "eval_loss": 0.7512525320053101,
93
- "eval_precision": 0.8119380418523106,
94
- "eval_recall": 0.8119380418523106,
95
- "eval_runtime": 33.6314,
96
- "eval_samples_per_second": 61.014,
97
- "eval_steps_per_second": 3.836,
98
- "step": 2500
99
- },
100
- {
101
- "epoch": 1.25,
102
- "learning_rate": 3.756543415039468e-05,
103
- "loss": 0.2377,
104
- "step": 3000
105
- },
106
- {
107
- "epoch": 1.25,
108
- "eval_accuracy": 0.8165945537308391,
109
- "eval_f1": 0.8165945537308391,
110
- "eval_loss": 0.9047627449035645,
111
- "eval_precision": 0.8165945537308391,
112
- "eval_recall": 0.8165945537308391,
113
- "eval_runtime": 39.8436,
114
- "eval_samples_per_second": 51.501,
115
- "eval_steps_per_second": 3.238,
116
- "step": 3000
117
- },
118
- {
119
- "epoch": 1.45,
120
- "learning_rate": 3.548815953469049e-05,
121
- "loss": 0.2401,
122
- "step": 3500
123
- },
124
- {
125
- "epoch": 1.45,
126
- "eval_accuracy": 0.7939071271171446,
127
- "eval_f1": 0.7939071271171445,
128
- "eval_loss": 1.241086721420288,
129
- "eval_precision": 0.7939071271171446,
130
- "eval_recall": 0.7939071271171446,
131
- "eval_runtime": 34.8048,
132
- "eval_samples_per_second": 58.957,
133
- "eval_steps_per_second": 3.706,
134
- "step": 3500
135
- },
136
- {
137
- "epoch": 1.66,
138
- "learning_rate": 3.341088491898629e-05,
139
- "loss": 0.2054,
140
- "step": 4000
141
- },
142
- {
143
- "epoch": 1.66,
144
- "eval_accuracy": 0.8079812131057889,
145
- "eval_f1": 0.8079812131057889,
146
- "eval_loss": 1.1594407558441162,
147
- "eval_precision": 0.8079812131057889,
148
- "eval_recall": 0.8079812131057889,
149
- "eval_runtime": 39.5136,
150
- "eval_samples_per_second": 51.932,
151
- "eval_steps_per_second": 3.265,
152
- "step": 4000
153
- },
154
- {
155
- "epoch": 1.87,
156
- "learning_rate": 3.133361030328209e-05,
157
- "loss": 0.1909,
158
- "step": 4500
159
- },
160
- {
161
- "epoch": 1.87,
162
- "eval_accuracy": 0.8424747872802432,
163
- "eval_f1": 0.842474787280243,
164
- "eval_loss": 0.7545156478881836,
165
- "eval_precision": 0.8424747872802432,
166
- "eval_recall": 0.8424747872802432,
167
- "eval_runtime": 35.061,
168
- "eval_samples_per_second": 58.527,
169
- "eval_steps_per_second": 3.679,
170
- "step": 4500
171
- },
172
- {
173
- "epoch": 2.08,
174
- "learning_rate": 2.9256335687577903e-05,
175
- "loss": 0.1704,
176
- "step": 5000
177
- },
178
- {
179
- "epoch": 2.08,
180
- "eval_accuracy": 0.8317543549243216,
181
- "eval_f1": 0.8317543549243216,
182
- "eval_loss": 0.856721818447113,
183
- "eval_precision": 0.8317543549243216,
184
- "eval_recall": 0.8317543549243216,
185
- "eval_runtime": 38.2513,
186
- "eval_samples_per_second": 53.645,
187
- "eval_steps_per_second": 3.372,
188
- "step": 5000
189
- },
190
- {
191
- "epoch": 2.29,
192
- "learning_rate": 2.7179061071873702e-05,
193
- "loss": 0.1294,
194
- "step": 5500
195
- },
196
- {
197
- "epoch": 2.29,
198
- "eval_accuracy": 0.8489327821653182,
199
- "eval_f1": 0.8489327821653182,
200
- "eval_loss": 0.8485749959945679,
201
- "eval_precision": 0.8489327821653182,
202
- "eval_recall": 0.8489327821653182,
203
- "eval_runtime": 33.5765,
204
- "eval_samples_per_second": 61.114,
205
- "eval_steps_per_second": 3.842,
206
- "step": 5500
207
- },
208
- {
209
- "epoch": 2.49,
210
- "learning_rate": 2.5101786456169508e-05,
211
- "loss": 0.134,
212
- "step": 6000
213
- },
214
- {
215
- "epoch": 2.49,
216
- "eval_accuracy": 0.8573209374145502,
217
- "eval_f1": 0.8573209374145502,
218
- "eval_loss": 0.7681939005851746,
219
- "eval_precision": 0.8573209374145502,
220
- "eval_recall": 0.8573209374145502,
221
- "eval_runtime": 39.5768,
222
- "eval_samples_per_second": 51.849,
223
- "eval_steps_per_second": 3.259,
224
- "step": 6000
225
- },
226
- {
227
- "epoch": 2.7,
228
- "learning_rate": 2.302451184046531e-05,
229
- "loss": 0.1354,
230
- "step": 6500
231
- },
232
- {
233
- "epoch": 2.7,
234
- "eval_accuracy": 0.8255697994241689,
235
- "eval_f1": 0.8255697994241689,
236
- "eval_loss": 0.9870807528495789,
237
- "eval_precision": 0.8255697994241689,
238
- "eval_recall": 0.8255697994241689,
239
- "eval_runtime": 34.6532,
240
- "eval_samples_per_second": 59.215,
241
- "eval_steps_per_second": 3.723,
242
- "step": 6500
243
- },
244
- {
245
- "epoch": 2.91,
246
- "learning_rate": 2.0947237224761117e-05,
247
- "loss": 0.1239,
248
- "step": 7000
249
- },
250
- {
251
- "epoch": 2.91,
252
- "eval_accuracy": 0.8189268308375287,
253
- "eval_f1": 0.8189268308375287,
254
- "eval_loss": 1.1430405378341675,
255
- "eval_precision": 0.8189268308375287,
256
- "eval_recall": 0.8189268308375287,
257
- "eval_runtime": 39.4751,
258
- "eval_samples_per_second": 51.982,
259
- "eval_steps_per_second": 3.268,
260
- "step": 7000
261
- },
262
- {
263
- "epoch": 3.12,
264
- "learning_rate": 1.886996260905692e-05,
265
- "loss": 0.1012,
266
- "step": 7500
267
- },
268
- {
269
- "epoch": 3.12,
270
- "eval_accuracy": 0.8385581702079747,
271
- "eval_f1": 0.8385581702079747,
272
- "eval_loss": 0.8271787166595459,
273
- "eval_precision": 0.8385581702079747,
274
- "eval_recall": 0.8385581702079747,
275
- "eval_runtime": 33.307,
276
- "eval_samples_per_second": 61.609,
277
- "eval_steps_per_second": 3.873,
278
- "step": 7500
279
- },
280
- {
281
- "epoch": 3.32,
282
- "learning_rate": 1.6792687993352722e-05,
283
- "loss": 0.0788,
284
- "step": 8000
285
- },
286
- {
287
- "epoch": 3.32,
288
- "eval_accuracy": 0.8364993324862074,
289
- "eval_f1": 0.8364993324862076,
290
- "eval_loss": 1.028805136680603,
291
- "eval_precision": 0.8364993324862074,
292
- "eval_recall": 0.8364993324862074,
293
- "eval_runtime": 38.2117,
294
- "eval_samples_per_second": 53.701,
295
- "eval_steps_per_second": 3.376,
296
- "step": 8000
297
- },
298
- {
299
- "epoch": 3.53,
300
- "learning_rate": 1.4715413377648527e-05,
301
- "loss": 0.0802,
302
- "step": 8500
303
- },
304
- {
305
- "epoch": 3.53,
306
- "eval_accuracy": 0.8849383152916955,
307
- "eval_f1": 0.8849383152916955,
308
- "eval_loss": 0.719699501991272,
309
- "eval_precision": 0.8849383152916955,
310
- "eval_recall": 0.8849383152916955,
311
- "eval_runtime": 34.4056,
312
- "eval_samples_per_second": 59.641,
313
- "eval_steps_per_second": 3.749,
314
- "step": 8500
315
- },
316
- {
317
- "epoch": 3.74,
318
- "learning_rate": 1.263813876194433e-05,
319
- "loss": 0.0861,
320
- "step": 9000
321
- },
322
- {
323
- "epoch": 3.74,
324
- "eval_accuracy": 0.8319634556304386,
325
- "eval_f1": 0.8319634556304386,
326
- "eval_loss": 1.1419589519500732,
327
- "eval_precision": 0.8319634556304386,
328
- "eval_recall": 0.8319634556304386,
329
- "eval_runtime": 39.7118,
330
- "eval_samples_per_second": 51.672,
331
- "eval_steps_per_second": 3.248,
332
- "step": 9000
333
- },
334
- {
335
- "epoch": 3.95,
336
- "learning_rate": 1.0560864146240134e-05,
337
- "loss": 0.0639,
338
- "step": 9500
339
- },
340
- {
341
- "epoch": 3.95,
342
- "eval_accuracy": 0.8585272876421483,
343
- "eval_f1": 0.8585272876421483,
344
- "eval_loss": 0.9562506079673767,
345
- "eval_precision": 0.8585272876421483,
346
- "eval_recall": 0.8585272876421483,
347
- "eval_runtime": 33.8854,
348
- "eval_samples_per_second": 60.557,
349
- "eval_steps_per_second": 3.807,
350
- "step": 9500
351
- },
352
- {
353
- "epoch": 4.15,
354
- "learning_rate": 8.483589530535937e-06,
355
- "loss": 0.0464,
356
- "step": 10000
357
- },
358
- {
359
- "epoch": 4.15,
360
- "eval_accuracy": 0.8510961702401442,
361
- "eval_f1": 0.8510961702401442,
362
- "eval_loss": 1.0767754316329956,
363
- "eval_precision": 0.8510961702401442,
364
- "eval_recall": 0.8510961702401442,
365
- "eval_runtime": 38.7314,
366
- "eval_samples_per_second": 52.98,
367
- "eval_steps_per_second": 3.331,
368
- "step": 10000
369
- },
370
- {
371
- "epoch": 4.36,
372
- "learning_rate": 6.406314914831742e-06,
373
- "loss": 0.0412,
374
- "step": 10500
375
- },
376
- {
377
- "epoch": 4.36,
378
- "eval_accuracy": 0.8439143652185103,
379
- "eval_f1": 0.8439143652185103,
380
- "eval_loss": 1.1184284687042236,
381
- "eval_precision": 0.8439143652185103,
382
- "eval_recall": 0.8439143652185103,
383
- "eval_runtime": 34.8108,
384
- "eval_samples_per_second": 58.947,
385
- "eval_steps_per_second": 3.706,
386
- "step": 10500
387
- },
388
- {
389
- "epoch": 4.57,
390
- "learning_rate": 4.333194848358953e-06,
391
- "loss": 0.039,
392
- "step": 11000
393
- },
394
- {
395
- "epoch": 4.57,
396
- "eval_accuracy": 0.8635778739283588,
397
- "eval_f1": 0.8635778739283588,
398
- "eval_loss": 0.9634060263633728,
399
- "eval_precision": 0.8635778739283588,
400
- "eval_recall": 0.8635778739283588,
401
- "eval_runtime": 39.6244,
402
- "eval_samples_per_second": 51.786,
403
- "eval_steps_per_second": 3.256,
404
- "step": 11000
405
- }
406
- ],
407
- "max_steps": 12035,
408
- "num_train_epochs": 5,
409
- "total_flos": 1.835352614695219e+16,
410
- "trial_name": null,
411
- "trial_params": null
412
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-11500/config.json DELETED
@@ -1,56 +0,0 @@
1
- {
2
- "_name_or_path": "nielsr/lilt-xlm-roberta-base",
3
- "architectures": [
4
- "LiltForTokenClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "bos_token_id": 0,
8
- "channel_shrink_ratio": 4,
9
- "classifier_dropout": null,
10
- "eos_token_id": 2,
11
- "hidden_act": "gelu",
12
- "hidden_dropout_prob": 0.1,
13
- "hidden_size": 768,
14
- "id2label": {
15
- "0": "Caption",
16
- "1": "Footnote",
17
- "2": "Formula",
18
- "3": "List-item",
19
- "4": "Page-footer",
20
- "5": "Page-header",
21
- "6": "Picture",
22
- "7": "Section-header",
23
- "8": "Table",
24
- "9": "Text",
25
- "10": "Title"
26
- },
27
- "initializer_range": 0.02,
28
- "intermediate_size": 3072,
29
- "label2id": {
30
- "Caption": 0,
31
- "Footnote": 1,
32
- "Formula": 2,
33
- "List-item": 3,
34
- "Page-footer": 4,
35
- "Page-header": 5,
36
- "Picture": 6,
37
- "Section-header": 7,
38
- "Table": 8,
39
- "Text": 9,
40
- "Title": 10
41
- },
42
- "layer_norm_eps": 1e-05,
43
- "max_2d_position_embeddings": 1024,
44
- "max_position_embeddings": 514,
45
- "model_type": "lilt",
46
- "num_attention_heads": 12,
47
- "num_hidden_layers": 12,
48
- "output_past": true,
49
- "pad_token_id": 1,
50
- "position_embedding_type": "absolute",
51
- "torch_dtype": "float32",
52
- "transformers_version": "4.26.0",
53
- "type_vocab_size": 1,
54
- "use_cache": true,
55
- "vocab_size": 250002
56
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-11500/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a987de3ede3a55ee97ff63886937a088657c2157826f53d07345ccc9c7e5d778
3
- size 2265828101
 
 
 
 
checkpoint-11500/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ec4d60da8dcded02dd5639d5b8b5174bf534b01c0f3a7ab99393164e017b39f
3
- size 627
 
 
 
 
checkpoint-11500/special_tokens_map.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "bos_token": "<s>",
3
- "cls_token": "<s>",
4
- "eos_token": "</s>",
5
- "mask_token": {
6
- "content": "<mask>",
7
- "lstrip": true,
8
- "normalized": false,
9
- "rstrip": false,
10
- "single_word": false
11
- },
12
- "pad_token": "<pad>",
13
- "sep_token": "</s>",
14
- "unk_token": "<unk>"
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-11500/tokenizer.json DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
3
- size 17082660
 
 
 
 
checkpoint-11500/tokenizer_config.json DELETED
@@ -1,20 +0,0 @@
1
- {
2
- "bos_token": "<s>",
3
- "cls_token": "<s>",
4
- "eos_token": "</s>",
5
- "mask_token": {
6
- "__type": "AddedToken",
7
- "content": "<mask>",
8
- "lstrip": true,
9
- "normalized": true,
10
- "rstrip": false,
11
- "single_word": false
12
- },
13
- "model_max_length": 512,
14
- "name_or_path": "nielsr/lilt-xlm-roberta-base",
15
- "pad_token": "<pad>",
16
- "sep_token": "</s>",
17
- "special_tokens_map_file": null,
18
- "tokenizer_class": "XLMRobertaTokenizer",
19
- "unk_token": "<unk>"
20
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-11500/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b3cb303483efa6f2dc51db1cfb9b16000da398e2d72673041025bfff104b3b8
3
- size 3643
 
 
 
 
{checkpoint-11000 β†’ checkpoint-12000}/config.json RENAMED
File without changes
{checkpoint-11000 β†’ checkpoint-12000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a373613aeeb4d6be34886b231335f8c8f20879c526ba375b702a8ec78acc96a8
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0377763861e1565e68485e8f32b7a5c377a24284acd536ab0029416d61d03d48
3
  size 2265828101
{checkpoint-11500 β†’ checkpoint-12000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a336d572b84d95a1c812e645a72e90873027257b83cee92eef0d3a78890c576
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9b13e786aeddc70907b9ab2ab994abb01bbd8b9fc1b605eb6d43b6bd26a7bf0
3
  size 1134425553
{checkpoint-11500 β†’ checkpoint-12000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0b8ef7d104554cd305a60fb7a5d256c7f82cfc12dc853397197d87e16ef1f65
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9977b81b71597a1403649a2cd7ca5af0ff76ea09f7cc4fd6954a25d51c950458
3
  size 14575
{checkpoint-11500 β†’ checkpoint-12000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ee4f114f4e57c077eb75e91b7efc254c244508b080b0e6980415bdd75809aff
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ade8adec025aa8c55d5922c910484f65a4f9a8ee23da0b6291286fb7fdd6926a
3
  size 557
{checkpoint-11000 β†’ checkpoint-12000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bc076744799314c413b1a22fd57768d86453e79c6cbb2e75e964b3a373c4958
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d9dec43e359a11ff94e53c08c39c3034d0df5115ac402825b9258dc21576cba
3
  size 627
{checkpoint-11000 β†’ checkpoint-12000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-11000 β†’ checkpoint-12000}/tokenizer.json RENAMED
File without changes
{checkpoint-11000 β†’ checkpoint-12000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-11500 β†’ checkpoint-12000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
- "epoch": 4.777731616119651,
5
- "global_step": 11500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -420,11 +420,29 @@
420
  "eval_samples_per_second": 58.569,
421
  "eval_steps_per_second": 3.682,
422
  "step": 11500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
423
  }
424
  ],
425
  "max_steps": 12035,
426
  "num_train_epochs": 5,
427
- "total_flos": 1.918804286349619e+16,
428
  "trial_name": null,
429
  "trial_params": null
430
  }
 
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
+ "epoch": 4.985459077690071,
5
+ "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
420
  "eval_samples_per_second": 58.569,
421
  "eval_steps_per_second": 3.682,
422
  "step": 11500
423
+ },
424
+ {
425
+ "epoch": 4.99,
426
+ "learning_rate": 1.7864561695056087e-07,
427
+ "loss": 0.0395,
428
+ "step": 12000
429
+ },
430
+ {
431
+ "epoch": 4.99,
432
+ "eval_accuracy": 0.8583503562754339,
433
+ "eval_f1": 0.8583503562754339,
434
+ "eval_loss": 1.0003422498703003,
435
+ "eval_precision": 0.8583503562754339,
436
+ "eval_recall": 0.8583503562754339,
437
+ "eval_runtime": 39.4996,
438
+ "eval_samples_per_second": 51.95,
439
+ "eval_steps_per_second": 3.266,
440
+ "step": 12000
441
  }
442
  ],
443
  "max_steps": 12035,
444
  "num_train_epochs": 5,
445
+ "total_flos": 2.002255958004019e+16,
446
  "trial_name": null,
447
  "trial_params": null
448
  }
{checkpoint-11000 β†’ checkpoint-12000}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a336d572b84d95a1c812e645a72e90873027257b83cee92eef0d3a78890c576
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e39c7d7515bc3fd9710bfa20bd4d1d7c408894096e55b518c4e64c07ac0ff33b
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21b09326263f0fbe132c2f3bc4c0d88999487e384816c9a0719ad3719c72fd3d
3
- size 19096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6995b72b1d777bdf7ca3001094bdb7626e66b36cb75e85a842900924e4a2f0d7
3
+ size 20079