rpham committed on
Commit
a125d94
1 Parent(s): fdd89e6

Model save

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. all_results.json +2 -2
  3. test_results.json +2 -6
  4. trainer_state.json +117 -345
README.md CHANGED
@@ -18,9 +18,9 @@ This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingfac
18
  It achieves the following results on the evaluation set:
19
  - eval_loss: 0.9552
20
  - eval_accuracy: 0.7059
21
- - eval_runtime: 7.648
22
- - eval_samples_per_second: 13.337
23
- - eval_steps_per_second: 3.4
24
  - epoch: 2.2541
25
  - step: 186
26
 
 
18
  It achieves the following results on the evaluation set:
19
  - eval_loss: 0.9552
20
  - eval_accuracy: 0.7059
21
+ - eval_runtime: 7.5849
22
+ - eval_samples_per_second: 13.448
23
+ - eval_steps_per_second: 3.428
24
  - epoch: 2.2541
25
  - step: 186
26
 
all_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.2438524590163933,
3
- "eval_accuracy": 0.7647058823529411,
4
- "eval_loss": 0.8334438800811768,
5
  "eval_runtime": 7.7031,
6
  "eval_samples_per_second": 13.241,
7
  "eval_steps_per_second": 6.621
 
1
  {
2
  "epoch": 3.2438524590163933,
3
+ "eval_accuracy": 0.7058823529411765,
4
+ "eval_loss": 0.9551951289176941,
5
  "eval_runtime": 7.7031,
6
  "eval_samples_per_second": 13.241,
7
  "eval_steps_per_second": 6.621
test_results.json CHANGED
@@ -1,8 +1,4 @@
1
  {
2
- "epoch": 3.2438524590163933,
3
- "eval_accuracy": 0.7647058823529411,
4
- "eval_loss": 0.8334438800811768,
5
- "eval_runtime": 7.7031,
6
- "eval_samples_per_second": 13.241,
7
- "eval_steps_per_second": 6.621
8
  }
 
1
  {
2
+ "eval_accuracy": 0.7058823529411765,
3
+ "eval_loss": 0.9551951289176941
 
 
 
 
4
  }
trainer_state.json CHANGED
@@ -1,415 +1,187 @@
1
  {
2
- "best_metric": 0.7021276595744681,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-488",
4
- "epoch": 3.2438524590163933,
5
  "eval_steps": 500,
6
- "global_step": 488,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.020491803278688523,
13
- "grad_norm": 17.668354034423828,
14
- "learning_rate": 1.0204081632653061e-05,
15
- "loss": 0.5899,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.040983606557377046,
20
- "grad_norm": 0.9543402194976807,
21
- "learning_rate": 2.0408163265306123e-05,
22
- "loss": 0.8724,
23
  "step": 20
24
  },
25
  {
26
- "epoch": 0.06147540983606557,
27
- "grad_norm": 32.570133209228516,
28
- "learning_rate": 3.061224489795919e-05,
29
- "loss": 0.8359,
30
  "step": 30
31
  },
32
  {
33
- "epoch": 0.08196721311475409,
34
- "grad_norm": 18.297029495239258,
35
- "learning_rate": 4.0816326530612245e-05,
36
- "loss": 1.0188,
37
  "step": 40
38
  },
39
  {
40
- "epoch": 0.10245901639344263,
41
- "grad_norm": 1.2347818613052368,
42
- "learning_rate": 4.988610478359909e-05,
43
- "loss": 1.1604,
44
  "step": 50
45
  },
46
  {
47
- "epoch": 0.12295081967213115,
48
- "grad_norm": 14.211080551147461,
49
- "learning_rate": 4.874715261958998e-05,
50
- "loss": 0.8299,
51
  "step": 60
52
  },
53
  {
54
- "epoch": 0.14344262295081966,
55
- "grad_norm": 74.23954772949219,
56
- "learning_rate": 4.760820045558087e-05,
57
- "loss": 1.1473,
 
 
 
 
 
 
 
 
 
58
  "step": 70
59
  },
60
  {
61
- "epoch": 0.16393442622950818,
62
- "grad_norm": 14.923948287963867,
63
- "learning_rate": 4.6469248291571756e-05,
64
- "loss": 1.3967,
65
  "step": 80
66
  },
67
  {
68
- "epoch": 0.18442622950819673,
69
- "grad_norm": 26.641878128051758,
70
- "learning_rate": 4.5330296127562645e-05,
71
- "loss": 0.9765,
72
  "step": 90
73
  },
74
  {
75
- "epoch": 0.20491803278688525,
76
- "grad_norm": 1.4160146713256836,
77
- "learning_rate": 4.419134396355353e-05,
78
- "loss": 0.8614,
79
  "step": 100
80
  },
81
  {
82
- "epoch": 0.22540983606557377,
83
- "grad_norm": 0.6423073410987854,
84
- "learning_rate": 4.305239179954442e-05,
85
- "loss": 1.0474,
86
  "step": 110
87
  },
88
  {
89
- "epoch": 0.2459016393442623,
90
- "grad_norm": 12.656720161437988,
91
- "learning_rate": 4.191343963553531e-05,
92
- "loss": 1.4877,
93
  "step": 120
94
  },
95
  {
96
- "epoch": 0.2520491803278688,
97
- "eval_accuracy": 0.48936170212765956,
98
- "eval_loss": 1.489047884941101,
99
- "eval_runtime": 3.5398,
100
- "eval_samples_per_second": 13.278,
101
- "eval_steps_per_second": 6.78,
102
- "step": 123
103
  },
104
  {
105
- "epoch": 1.014344262295082,
106
- "grad_norm": 151.98411560058594,
107
- "learning_rate": 4.07744874715262e-05,
108
- "loss": 1.5679,
109
  "step": 130
110
  },
111
  {
112
- "epoch": 1.0348360655737705,
113
- "grad_norm": 104.5379638671875,
114
- "learning_rate": 3.9635535307517086e-05,
115
- "loss": 0.7741,
116
  "step": 140
117
  },
118
  {
119
- "epoch": 1.055327868852459,
120
- "grad_norm": 11.863714218139648,
121
- "learning_rate": 3.8496583143507975e-05,
122
- "loss": 0.9627,
123
  "step": 150
124
  },
125
  {
126
- "epoch": 1.0758196721311475,
127
- "grad_norm": 2.847776412963867,
128
- "learning_rate": 3.735763097949886e-05,
129
- "loss": 0.6829,
130
  "step": 160
131
  },
132
  {
133
- "epoch": 1.096311475409836,
134
- "grad_norm": 7.588573455810547,
135
- "learning_rate": 3.621867881548975e-05,
136
- "loss": 0.8791,
137
  "step": 170
138
  },
139
  {
140
- "epoch": 1.1168032786885247,
141
- "grad_norm": 39.9682502746582,
142
- "learning_rate": 3.507972665148064e-05,
143
- "loss": 1.5947,
144
  "step": 180
145
  },
146
  {
147
- "epoch": 1.1372950819672132,
148
- "grad_norm": 36.84199142456055,
149
- "learning_rate": 3.394077448747153e-05,
150
- "loss": 0.6469,
151
- "step": 190
152
- },
153
- {
154
- "epoch": 1.1577868852459017,
155
- "grad_norm": 3.502577304840088,
156
- "learning_rate": 3.2801822323462416e-05,
157
- "loss": 0.6792,
158
- "step": 200
159
- },
160
- {
161
- "epoch": 1.1782786885245902,
162
- "grad_norm": 48.51677703857422,
163
- "learning_rate": 3.1662870159453304e-05,
164
- "loss": 0.8278,
165
- "step": 210
166
- },
167
- {
168
- "epoch": 1.1987704918032787,
169
- "grad_norm": 18.526588439941406,
170
- "learning_rate": 3.052391799544419e-05,
171
- "loss": 1.0883,
172
- "step": 220
173
- },
174
- {
175
- "epoch": 1.2192622950819672,
176
- "grad_norm": 0.22596795856952667,
177
- "learning_rate": 2.938496583143508e-05,
178
- "loss": 1.5731,
179
- "step": 230
180
- },
181
- {
182
- "epoch": 1.2397540983606556,
183
- "grad_norm": 43.027931213378906,
184
- "learning_rate": 2.824601366742597e-05,
185
- "loss": 1.0259,
186
- "step": 240
187
- },
188
- {
189
- "epoch": 1.2520491803278688,
190
- "eval_accuracy": 0.6595744680851063,
191
- "eval_loss": 1.1473325490951538,
192
- "eval_runtime": 3.5233,
193
- "eval_samples_per_second": 13.34,
194
- "eval_steps_per_second": 6.812,
195
- "step": 246
196
- },
197
- {
198
- "epoch": 2.0081967213114753,
199
- "grad_norm": 16.573293685913086,
200
- "learning_rate": 2.7107061503416858e-05,
201
- "loss": 0.8229,
202
- "step": 250
203
- },
204
- {
205
- "epoch": 2.028688524590164,
206
- "grad_norm": 34.50025177001953,
207
- "learning_rate": 2.596810933940775e-05,
208
- "loss": 1.2741,
209
- "step": 260
210
- },
211
- {
212
- "epoch": 2.0491803278688523,
213
- "grad_norm": 16.234542846679688,
214
- "learning_rate": 2.4829157175398634e-05,
215
- "loss": 0.8029,
216
- "step": 270
217
- },
218
- {
219
- "epoch": 2.069672131147541,
220
- "grad_norm": 36.11598587036133,
221
- "learning_rate": 2.3690205011389523e-05,
222
- "loss": 0.4739,
223
- "step": 280
224
- },
225
- {
226
- "epoch": 2.0901639344262297,
227
- "grad_norm": 53.0654182434082,
228
- "learning_rate": 2.255125284738041e-05,
229
- "loss": 0.9375,
230
- "step": 290
231
- },
232
- {
233
- "epoch": 2.110655737704918,
234
- "grad_norm": 27.09005355834961,
235
- "learning_rate": 2.14123006833713e-05,
236
- "loss": 0.5147,
237
- "step": 300
238
- },
239
- {
240
- "epoch": 2.1311475409836067,
241
- "grad_norm": 1.1381382942199707,
242
- "learning_rate": 2.0273348519362188e-05,
243
- "loss": 0.3669,
244
- "step": 310
245
- },
246
- {
247
- "epoch": 2.151639344262295,
248
- "grad_norm": 33.40491485595703,
249
- "learning_rate": 1.9134396355353076e-05,
250
- "loss": 0.7359,
251
- "step": 320
252
- },
253
- {
254
- "epoch": 2.1721311475409837,
255
- "grad_norm": 39.87897491455078,
256
- "learning_rate": 1.7995444191343964e-05,
257
- "loss": 0.8056,
258
- "step": 330
259
- },
260
- {
261
- "epoch": 2.192622950819672,
262
- "grad_norm": 0.3967530131340027,
263
- "learning_rate": 1.6856492027334853e-05,
264
- "loss": 0.6106,
265
- "step": 340
266
- },
267
- {
268
- "epoch": 2.2131147540983607,
269
- "grad_norm": 15.328410148620605,
270
- "learning_rate": 1.571753986332574e-05,
271
- "loss": 0.5864,
272
- "step": 350
273
- },
274
- {
275
- "epoch": 2.2336065573770494,
276
- "grad_norm": 0.5930748581886292,
277
- "learning_rate": 1.457858769931663e-05,
278
- "loss": 0.3236,
279
- "step": 360
280
- },
281
- {
282
- "epoch": 2.2520491803278686,
283
- "eval_accuracy": 0.6808510638297872,
284
- "eval_loss": 1.138521432876587,
285
- "eval_runtime": 3.5551,
286
- "eval_samples_per_second": 13.221,
287
- "eval_steps_per_second": 6.751,
288
- "step": 369
289
- },
290
- {
291
- "epoch": 3.002049180327869,
292
- "grad_norm": 0.42666512727737427,
293
- "learning_rate": 1.3439635535307518e-05,
294
- "loss": 0.6331,
295
- "step": 370
296
- },
297
- {
298
- "epoch": 3.0225409836065573,
299
- "grad_norm": 0.0817425474524498,
300
- "learning_rate": 1.2300683371298406e-05,
301
- "loss": 0.5621,
302
- "step": 380
303
- },
304
- {
305
- "epoch": 3.043032786885246,
306
- "grad_norm": 0.2686825692653656,
307
- "learning_rate": 1.1161731207289294e-05,
308
- "loss": 0.2522,
309
- "step": 390
310
- },
311
- {
312
- "epoch": 3.0635245901639343,
313
- "grad_norm": 0.08851628750562668,
314
- "learning_rate": 1.0022779043280183e-05,
315
- "loss": 0.7662,
316
- "step": 400
317
- },
318
- {
319
- "epoch": 3.084016393442623,
320
- "grad_norm": 0.9150404334068298,
321
- "learning_rate": 8.883826879271071e-06,
322
- "loss": 1.204,
323
- "step": 410
324
- },
325
- {
326
- "epoch": 3.1045081967213113,
327
- "grad_norm": 1.546443223953247,
328
- "learning_rate": 7.74487471526196e-06,
329
- "loss": 0.8539,
330
- "step": 420
331
- },
332
- {
333
- "epoch": 3.125,
334
- "grad_norm": 5.276226997375488,
335
- "learning_rate": 6.605922551252848e-06,
336
- "loss": 0.2554,
337
- "step": 430
338
- },
339
- {
340
- "epoch": 3.1454918032786887,
341
- "grad_norm": 0.19730453193187714,
342
- "learning_rate": 5.466970387243736e-06,
343
- "loss": 0.2582,
344
- "step": 440
345
- },
346
- {
347
- "epoch": 3.165983606557377,
348
- "grad_norm": 2.347675085067749,
349
- "learning_rate": 4.328018223234624e-06,
350
- "loss": 0.4179,
351
- "step": 450
352
- },
353
- {
354
- "epoch": 3.1864754098360657,
355
- "grad_norm": 0.2406870424747467,
356
- "learning_rate": 3.189066059225513e-06,
357
- "loss": 0.2018,
358
- "step": 460
359
- },
360
- {
361
- "epoch": 3.206967213114754,
362
- "grad_norm": 0.8780645728111267,
363
- "learning_rate": 2.050113895216401e-06,
364
- "loss": 0.2272,
365
- "step": 470
366
- },
367
- {
368
- "epoch": 3.2274590163934427,
369
- "grad_norm": 0.222975954413414,
370
- "learning_rate": 9.111617312072893e-07,
371
- "loss": 0.5371,
372
- "step": 480
373
- },
374
- {
375
- "epoch": 3.2438524590163933,
376
- "eval_accuracy": 0.7021276595744681,
377
- "eval_loss": 1.0504409074783325,
378
- "eval_runtime": 4.132,
379
- "eval_samples_per_second": 11.375,
380
- "eval_steps_per_second": 5.808,
381
- "step": 488
382
- },
383
- {
384
- "epoch": 3.2438524590163933,
385
- "step": 488,
386
- "total_flos": 1.2124749082531922e+18,
387
- "train_loss": 0.8016270340466108,
388
- "train_runtime": 367.025,
389
- "train_samples_per_second": 2.659,
390
- "train_steps_per_second": 1.33
391
  },
392
  {
393
- "epoch": 3.2438524590163933,
394
- "eval_accuracy": 0.7647058823529411,
395
- "eval_loss": 0.8334440588951111,
396
- "eval_runtime": 7.8397,
397
- "eval_samples_per_second": 13.011,
398
- "eval_steps_per_second": 6.505,
399
- "step": 488
400
  },
401
  {
402
- "epoch": 3.2438524590163933,
403
- "eval_accuracy": 0.7647058823529411,
404
- "eval_loss": 0.8334438800811768,
405
- "eval_runtime": 7.7031,
406
- "eval_samples_per_second": 13.241,
407
- "eval_steps_per_second": 6.621,
408
- "step": 488
409
  }
410
  ],
411
  "logging_steps": 10,
412
- "max_steps": 488,
413
  "num_input_tokens_seen": 0,
414
  "num_train_epochs": 9223372036854775807,
415
  "save_steps": 500,
@@ -420,13 +192,13 @@
420
  "should_evaluate": false,
421
  "should_log": false,
422
  "should_save": true,
423
- "should_training_stop": true
424
  },
425
  "attributes": {}
426
  }
427
  },
428
- "total_flos": 1.2124749082531922e+18,
429
- "train_batch_size": 2,
430
  "trial_name": null,
431
  "trial_params": null
432
  }
 
1
  {
2
+ "best_metric": 0.5957446808510638,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-124",
4
+ "epoch": 2.2540983606557377,
5
  "eval_steps": 500,
6
+ "global_step": 186,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.040983606557377046,
13
+ "grad_norm": 14.630450248718262,
14
+ "learning_rate": 2e-05,
15
+ "loss": 1.9953,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.08196721311475409,
20
+ "grad_norm": 12.040234565734863,
21
+ "learning_rate": 4e-05,
22
+ "loss": 2.0122,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 0.12295081967213115,
27
+ "grad_norm": 10.06123161315918,
28
+ "learning_rate": 4.8858447488584476e-05,
29
+ "loss": 1.9064,
30
  "step": 30
31
  },
32
  {
33
+ "epoch": 0.16393442622950818,
34
+ "grad_norm": 9.154711723327637,
35
+ "learning_rate": 4.657534246575342e-05,
36
+ "loss": 1.955,
37
  "step": 40
38
  },
39
  {
40
+ "epoch": 0.20491803278688525,
41
+ "grad_norm": 17.53380012512207,
42
+ "learning_rate": 4.4292237442922375e-05,
43
+ "loss": 1.8111,
44
  "step": 50
45
  },
46
  {
47
+ "epoch": 0.2459016393442623,
48
+ "grad_norm": 11.089496612548828,
49
+ "learning_rate": 4.200913242009132e-05,
50
+ "loss": 1.8106,
51
  "step": 60
52
  },
53
  {
54
+ "epoch": 0.2540983606557377,
55
+ "eval_accuracy": 0.19148936170212766,
56
+ "eval_loss": 1.8704100847244263,
57
+ "eval_runtime": 3.5011,
58
+ "eval_samples_per_second": 13.424,
59
+ "eval_steps_per_second": 3.428,
60
+ "step": 62
61
+ },
62
+ {
63
+ "epoch": 1.0327868852459017,
64
+ "grad_norm": 13.336834907531738,
65
+ "learning_rate": 3.9726027397260274e-05,
66
+ "loss": 1.8751,
67
  "step": 70
68
  },
69
  {
70
+ "epoch": 1.0737704918032787,
71
+ "grad_norm": 11.175029754638672,
72
+ "learning_rate": 3.744292237442922e-05,
73
+ "loss": 1.6123,
74
  "step": 80
75
  },
76
  {
77
+ "epoch": 1.1147540983606556,
78
+ "grad_norm": 10.622461318969727,
79
+ "learning_rate": 3.5159817351598174e-05,
80
+ "loss": 1.8106,
81
  "step": 90
82
  },
83
  {
84
+ "epoch": 1.1557377049180328,
85
+ "grad_norm": 9.679147720336914,
86
+ "learning_rate": 3.287671232876712e-05,
87
+ "loss": 1.567,
88
  "step": 100
89
  },
90
  {
91
+ "epoch": 1.1967213114754098,
92
+ "grad_norm": 14.767767906188965,
93
+ "learning_rate": 3.059360730593607e-05,
94
+ "loss": 1.5578,
95
  "step": 110
96
  },
97
  {
98
+ "epoch": 1.2377049180327868,
99
+ "grad_norm": 18.987808227539062,
100
+ "learning_rate": 2.8310502283105023e-05,
101
+ "loss": 1.4825,
102
  "step": 120
103
  },
104
  {
105
+ "epoch": 1.2540983606557377,
106
+ "eval_accuracy": 0.5957446808510638,
107
+ "eval_loss": 1.370785117149353,
108
+ "eval_runtime": 3.3745,
109
+ "eval_samples_per_second": 13.928,
110
+ "eval_steps_per_second": 3.556,
111
+ "step": 124
112
  },
113
  {
114
+ "epoch": 2.0245901639344264,
115
+ "grad_norm": 19.232662200927734,
116
+ "learning_rate": 2.6027397260273973e-05,
117
+ "loss": 1.196,
118
  "step": 130
119
  },
120
  {
121
+ "epoch": 2.0655737704918034,
122
+ "grad_norm": 23.459028244018555,
123
+ "learning_rate": 2.3744292237442922e-05,
124
+ "loss": 1.0483,
125
  "step": 140
126
  },
127
  {
128
+ "epoch": 2.1065573770491803,
129
+ "grad_norm": 15.685453414916992,
130
+ "learning_rate": 2.1461187214611872e-05,
131
+ "loss": 1.0462,
132
  "step": 150
133
  },
134
  {
135
+ "epoch": 2.1475409836065573,
136
+ "grad_norm": 16.980884552001953,
137
+ "learning_rate": 1.9178082191780822e-05,
138
+ "loss": 1.1794,
139
  "step": 160
140
  },
141
  {
142
+ "epoch": 2.1885245901639343,
143
+ "grad_norm": 20.012128829956055,
144
+ "learning_rate": 1.689497716894977e-05,
145
+ "loss": 0.8242,
146
  "step": 170
147
  },
148
  {
149
+ "epoch": 2.2295081967213113,
150
+ "grad_norm": 12.054617881774902,
151
+ "learning_rate": 1.4611872146118721e-05,
152
+ "loss": 0.872,
153
  "step": 180
154
  },
155
  {
156
+ "epoch": 2.2540983606557377,
157
+ "eval_accuracy": 0.5319148936170213,
158
+ "eval_loss": 1.0101068019866943,
159
+ "eval_runtime": 3.379,
160
+ "eval_samples_per_second": 13.91,
161
+ "eval_steps_per_second": 3.551,
162
+ "step": 186
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
163
  },
164
  {
165
+ "epoch": 2.2540983606557377,
166
+ "eval_accuracy": 0.7058823529411765,
167
+ "eval_loss": 0.9551948308944702,
168
+ "eval_runtime": 7.648,
169
+ "eval_samples_per_second": 13.337,
170
+ "eval_steps_per_second": 3.4,
171
+ "step": 186
172
  },
173
  {
174
+ "epoch": 2.2540983606557377,
175
+ "eval_accuracy": 0.7058823529411765,
176
+ "eval_loss": 0.9551951289176941,
177
+ "eval_runtime": 7.5849,
178
+ "eval_samples_per_second": 13.448,
179
+ "eval_steps_per_second": 3.428,
180
+ "step": 186
181
  }
182
  ],
183
  "logging_steps": 10,
184
+ "max_steps": 244,
185
  "num_input_tokens_seen": 0,
186
  "num_train_epochs": 9223372036854775807,
187
  "save_steps": 500,
 
192
  "should_evaluate": false,
193
  "should_log": false,
194
  "should_save": true,
195
+ "should_training_stop": false
196
  },
197
  "attributes": {}
198
  }
199
  },
200
+ "total_flos": 9.158983119898214e+17,
201
+ "train_batch_size": 4,
202
  "trial_name": null,
203
  "trial_params": null
204
  }